{"id":"https://openalex.org/W4372266769","doi":"https://doi.org/10.1109/icassp49357.2023.10094684","title":"Vitasd: Robust Vision Transformer Baselines for Autism Spectrum Disorder Facial Diagnosis","display_name":"Vitasd: Robust Vision Transformer Baselines for Autism Spectrum Disorder Facial Diagnosis","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372266769","doi":"https://doi.org/10.1109/icassp49357.2023.10094684"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10094684","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10094684","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100430970","display_name":"Xu Cao","orcid":"https://orcid.org/0000-0001-8739-5196"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xu Cao","raw_affiliation_strings":["New York University,New York,USA","New York University, New York, USA"],"affiliations":[{"raw_affiliation_string":"New York University,New York,USA","institution_ids":["https://openalex.org/I57206974"]},{"raw_affiliation_string":"New York University, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067298507","display_name":"Wenqian Ye","orcid":"https://orcid.org/0000-0002-6069-5153"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wenqian Ye","raw_affiliation_strings":["New York University,New York,USA","New York University, New York, USA"],"affiliations":[{"raw_affiliation_string":"New York University,New York,USA","institution_ids":["https://openalex.org/I57206974"]},{"raw_affiliation_string":"New York University, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085588558","display_name":"Elena Sizikova","orcid":"https://orcid.org/0009-0007-4422-6801"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Elena Sizikova","raw_affiliation_strings":["New York University,New York,USA","New York University, New York, USA"],"affiliations":[{"raw_affiliation_string":"New York University,New York,USA","institution_ids":["https://openalex.org/I57206974"]},{"raw_affiliation_string":"New York University, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100781916","display_name":"Xue Bai","orcid":"https://orcid.org/0000-0001-9717-846X"},"institutions":[{"id":"https://openalex.org/I4210152664","display_name":"Shenzhen Children's Hospital","ror":"https://ror.org/0409k5a27","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210152664"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xue Bai","raw_affiliation_strings":["Shenzhen Children&#x2019;s Hospital,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Children&#x2019;s Hospital,Shenzhen,China","institution_ids":["https://openalex.org/I4210152664"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004271884","display_name":"Megan Coffee","orcid":"https://orcid.org/0000-0002-4581-111X"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Megan Coffee","raw_affiliation_strings":["NYU Grossman School of Medicine,New York,USA","NYU Grossman School of Medicine, New York, USA"],"affiliations":[{"raw_affiliation_string":"NYU Grossman School of Medicine,New York,USA","institution_ids":["https://openalex.org/I57206974"]},{"raw_affiliation_string":"NYU Grossman School of Medicine, New York, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070424376","display_name":"Hongwu Zeng","orcid":"https://orcid.org/0000-0002-7832-3702"},"institutions":[{"id":"https://openalex.org/I4210152664","display_name":"Shenzhen Children's Hospital","ror":"https://ror.org/0409k5a27","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210152664"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongwu Zeng","raw_affiliation_strings":["Shenzhen Children&#x2019;s Hospital,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Children&#x2019;s Hospital,Shenzhen,China","institution_ids":["https://openalex.org/I4210152664"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008734591","display_name":"Jianguo Cao","orcid":"https://orcid.org/0000-0001-8781-5365"},"institutions":[{"id":"https://openalex.org/I4210152664","display_name":"Shenzhen Children's Hospital","ror":"https://ror.org/0409k5a27","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210152664"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianguo Cao","raw_affiliation_strings":["Shenzhen Children&#x2019;s Hospital,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Children&#x2019;s Hospital,Shenzhen,China","institution_ids":["https://openalex.org/I4210152664"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100430970"],"corresponding_institution_ids":["https://openalex.org/I57206974"],"apc_list":null,"apc_paid":null,"fwci":6.6711,"has_fulltext":false,"cited_by_count":26,"citation_normalized_percentile":{"value":0.9725789,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11094","display_name":"Face Recognition and Perception","score":0.9829000234603882,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autism-spectrum-disorder","display_name":"Autism spectrum disorder","score":0.667968213558197},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.561069667339325},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.45781368017196655},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4577753245830536},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.44262567162513733},{"id":"https://openalex.org/keywords/autism","display_name":"Autism","score":0.43421459197998047},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.331601083278656},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.20429879426956177},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12362396717071533},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.0773969292640686},{"id":"https://openalex.org/keywords/developmental-psychology","display_name":"Developmental psychology","score":0.07662004232406616}],"concepts":[{"id":"https://openalex.org/C2778538070","wikidata":"https://www.wikidata.org/wiki/Q1436063","display_name":"Autism spectrum disorder","level":3,"score":0.667968213558197},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.561069667339325},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.45781368017196655},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4577753245830536},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44262567162513733},{"id":"https://openalex.org/C205778803","wikidata":"https://www.wikidata.org/wiki/Q38404","display_name":"Autism","level":2,"score":0.43421459197998047},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.331601083278656},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.20429879426956177},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12362396717071533},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0773969292640686},{"id":"https://openalex.org/C138496976","wikidata":"https://www.wikidata.org/wiki/Q175002","display_name":"Developmental psychology","level":1,"score":0.07662004232406616},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10094684","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10094684","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W2101436791","https://openalex.org/W2745497104","https://openalex.org/W2912501419","https://openalex.org/W2920946364","https://openalex.org/W3009329175","https://openalex.org/W3091624500","https://openalex.org/W3094502228","https://openalex.org/W3164024107","https://openalex.org/W3173026327","https://openalex.org/W3210155031","https://openalex.org/W4205175089","https://openalex.org/W4211049957","https://openalex.org/W4214539404","https://openalex.org/W4223436232","https://openalex.org/W4226247407","https://openalex.org/W4286223290","https://openalex.org/W4291722303","https://openalex.org/W4297775537","https://openalex.org/W4312453657","https://openalex.org/W4313156423","https://openalex.org/W4321349965","https://openalex.org/W6737664043","https://openalex.org/W6742835484","https://openalex.org/W6784333009","https://openalex.org/W6795475546","https://openalex.org/W6797080668"],"related_works":["https://openalex.org/W4280602684","https://openalex.org/W4310092953","https://openalex.org/W2227393071","https://openalex.org/W4402326599","https://openalex.org/W1995350144","https://openalex.org/W2082102603","https://openalex.org/W2166141227","https://openalex.org/W3133980636","https://openalex.org/W4378085486","https://openalex.org/W4366602711"],"abstract_inverted_index":{"Autism":[0],"spectrum":[1],"disorder":[2,8],"(ASD)":[3],"is":[4],"a":[5,33,78,90,94,132],"lifelong":[6],"neurodevelopmental":[7],"with":[9,93],"very":[10],"high":[11],"prevalence":[12],"around":[13],"the":[14,19,43,46,51,100,121,129],"world.":[15],"Research":[16],"progress":[17],"in":[18,25,124],"field":[20],"of":[21,35,45,54,120],"ASD":[22,103,110,125],"facial":[23,67,111,126],"analysis":[24,53,112],"pediatric":[26,55],"patients":[27],"has":[28],"been":[29],"hindered":[30],"due":[31],"to":[32,81,98],"lack":[34],"well-established":[36],"baselines.":[37],"In":[38],"this":[39],"paper,":[40],"we":[41],"propose":[42],"use":[44],"Vision":[47],"Transformer":[48],"(ViT)":[49],"for":[50,102],"computational":[52],"ASD.":[56],"The":[57],"presented":[58],"model,":[59],"known":[60],"as":[61],"ViTASD,":[62],"distills":[63],"knowledge":[64],"from":[65,84],"large":[66],"expression":[68],"datasets":[69],"and":[70,88,137],"offers":[71],"model":[72],"structure":[73],"transferability.":[74],"Specifically,":[75],"ViTASD":[76],"employs":[77],"vanilla":[79],"ViT":[80],"extract":[82],"features":[83],"patients\u2019":[85],"face":[86],"images":[87],"adopts":[89],"lightweight":[91],"decoder":[92],"Gaussian":[95],"Process":[96],"layer":[97],"enhance":[99],"robustness":[101],"analysis.":[104],"Extensive":[105],"experiments":[106],"conducted":[107],"on":[108],"standard":[109],"benchmarks":[113],"show":[114],"that":[115],"our":[116],"method":[117],"outperforms":[118],"all":[119],"representative":[122],"approaches":[123],"analysis,":[127],"while":[128],"ViTASD-L":[130],"achieves":[131],"new":[133],"state-of-the-art.":[134],"Our":[135],"code":[136],"pretrained":[138],"models":[139],"are":[140],"available":[141],"at":[142],"https://github.com/IrohXu/ViTASD.":[143]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":7}],"updated_date":"2026-04-01T17:29:45.350535","created_date":"2025-10-10T00:00:00"}
