{"id":"https://openalex.org/W4394726579","doi":"https://doi.org/10.1142/s0218001424590043","title":"Representation Learning Based on Vision Transformer","display_name":"Representation Learning Based on Vision Transformer","publication_year":2024,"publication_date":"2024-04-11","ids":{"openalex":"https://openalex.org/W4394726579","doi":"https://doi.org/10.1142/s0218001424590043"},"language":"en","primary_location":{"id":"doi:10.1142/s0218001424590043","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0218001424590043","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095373071","display_name":"Ruisheng Ran","orcid":null},"institutions":[{"id":"https://openalex.org/I126924076","display_name":"Chongqing Normal University","ror":"https://ror.org/01dcw5w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I126924076"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ruisheng Ran","raw_affiliation_strings":["The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China"],"affiliations":[{"raw_affiliation_string":"The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China","institution_ids":["https://openalex.org/I126924076"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033296587","display_name":"Tianyu Gao","orcid":"https://orcid.org/0000-0002-1860-7252"},"institutions":[{"id":"https://openalex.org/I126924076","display_name":"Chongqing Normal University","ror":"https://ror.org/01dcw5w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I126924076"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianyu Gao","raw_affiliation_strings":["The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China"],"affiliations":[{"raw_affiliation_string":"The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China","institution_ids":["https://openalex.org/I126924076"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102633531","display_name":"Qianwei Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qianwei Hu","raw_affiliation_strings":["Chongqing Dinghui Information Technology Co., Ltd., Chongqing 401147, P. R. China"],"affiliations":[{"raw_affiliation_string":"Chongqing Dinghui Information Technology Co., Ltd., Chongqing 401147, P. R. China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061246177","display_name":"Wenfeng Zhang","orcid":"https://orcid.org/0009-0003-2079-993X"},"institutions":[{"id":"https://openalex.org/I126924076","display_name":"Chongqing Normal University","ror":"https://ror.org/01dcw5w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I126924076"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenfeng Zhang","raw_affiliation_strings":["The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China"],"affiliations":[{"raw_affiliation_string":"The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China","institution_ids":["https://openalex.org/I126924076"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101602318","display_name":"Shunshun Peng","orcid":"https://orcid.org/0000-0003-1887-0592"},"institutions":[{"id":"https://openalex.org/I126924076","display_name":"Chongqing Normal University","ror":"https://ror.org/01dcw5w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I126924076"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shunshun Peng","raw_affiliation_strings":["The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China"],"affiliations":[{"raw_affiliation_string":"The College of Computer and Information Science, Chongqing Normal University, Chongqing 401331, P. R. China","institution_ids":["https://openalex.org/I126924076"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101627689","display_name":"Bin Fang","orcid":"https://orcid.org/0000-0003-3257-3033"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Fang","raw_affiliation_strings":["The College of Computer Science, Chongqing University, Chongqing 400044, P. R. China"],"affiliations":[{"raw_affiliation_string":"The College of Computer Science, Chongqing University, Chongqing 400044, P. R. China","institution_ids":["https://openalex.org/I158842170"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5095373071"],"corresponding_institution_ids":["https://openalex.org/I126924076"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03717365,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"38","issue":"07","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7532899975776672},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.690784215927124},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6756502389907837},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.6156354546546936},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5574032664299011},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4751710295677185},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.46467334032058716},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43493354320526123},{"id":"https://openalex.org/keywords/data-redundancy","display_name":"Data redundancy","score":0.4264974594116211},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41840147972106934},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4090038537979126}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7532899975776672},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.690784215927124},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6756502389907837},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.6156354546546936},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5574032664299011},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4751710295677185},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.46467334032058716},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43493354320526123},{"id":"https://openalex.org/C7545210","wikidata":"https://www.wikidata.org/wiki/Q838123","display_name":"Data redundancy","level":2,"score":0.4264974594116211},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41840147972106934},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4090038537979126},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1142/s0218001424590043","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0218001424590043","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6506172023","display_name":null,"funder_award_id":"61876026","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1498436455","https://openalex.org/W1535602073","https://openalex.org/W1616262590","https://openalex.org/W1975056068","https://openalex.org/W2002454301","https://openalex.org/W2025768430","https://openalex.org/W2044913453","https://openalex.org/W2070148066","https://openalex.org/W2100495367","https://openalex.org/W2128728535","https://openalex.org/W2143784448","https://openalex.org/W2163922914","https://openalex.org/W2171061940","https://openalex.org/W2194775991","https://openalex.org/W2213612645","https://openalex.org/W2334493732","https://openalex.org/W2404498690","https://openalex.org/W2557864411","https://openalex.org/W2611632661","https://openalex.org/W2618530766","https://openalex.org/W2663800299","https://openalex.org/W2747680751","https://openalex.org/W2799215068","https://openalex.org/W2887567284","https://openalex.org/W2888198675","https://openalex.org/W2906666325","https://openalex.org/W2910603373","https://openalex.org/W2962898354","https://openalex.org/W2962949934","https://openalex.org/W2963499153","https://openalex.org/W2964086552","https://openalex.org/W3000409346","https://openalex.org/W3015646845","https://openalex.org/W3034730995","https://openalex.org/W3035414587","https://openalex.org/W3046428525","https://openalex.org/W3102431071","https://openalex.org/W3110144845","https://openalex.org/W3113767342","https://openalex.org/W3119687891","https://openalex.org/W3131860561","https://openalex.org/W3143107425","https://openalex.org/W3194481141","https://openalex.org/W3199528201","https://openalex.org/W3214066484","https://openalex.org/W4313156423","https://openalex.org/W4318677156","https://openalex.org/W4378649427","https://openalex.org/W4386076522"],"related_works":["https://openalex.org/W4296209631","https://openalex.org/W2561617217","https://openalex.org/W2025378473","https://openalex.org/W4390516098","https://openalex.org/W2355801475","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W4206659427","https://openalex.org/W2170062176","https://openalex.org/W2148135840"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"with":[3,133],"the":[4,10,44,72,83,101,111,116,138,143,149],"rapid":[5],"development":[6],"of":[7,12,26,79,85,115,145,151],"information":[8],"technology,":[9],"volume":[11],"image":[13,86,107,125],"data":[14,123],"has":[15,48],"grown":[16],"exponentially.":[17],"However,":[18],"these":[19],"datasets":[20],"typically":[21],"contain":[22],"a":[23,38,67],"large":[24],"amount":[25],"redundant":[27,89],"information.":[28],"To":[29],"extract":[30],"effective":[31],"features":[32],"and":[33,51,91,100,129],"reduce":[34,82],"redundancy":[35],"from":[36],"images,":[37],"representation":[39,112,135,152],"learning":[40,62,113,136],"method":[41,65,118,147],"based":[42],"on":[43],"Vision":[45],"Transformer":[46,56],"(ViT)":[47],"been":[49],"proposed,":[50],"to":[52,60,81],"our":[53],"best":[54],"knowledge,":[55],"was":[57],"first":[58],"applied":[59],"zero-shot":[61],"(ZSL).":[63],"The":[64],"adopts":[66],"symmetric":[68],"encoder\u2013decoder":[69],"structure,":[70],"where":[71],"encoder":[73],"incorporates":[74],"Multi-Head":[75],"Self-Attention":[76],"(MSA)":[77],"mechanism":[78],"ViT":[80],"dimensionality":[84],"features,":[87,99],"eliminate":[88],"information,":[90],"decrease":[92],"computational":[93],"burden.":[94],"Consequently,":[95],"it":[96],"effectively":[97],"extracts":[98],"decoder":[102],"is":[103],"utilized":[104],"for":[105],"reconstructing":[106],"data.":[108],"We":[109],"evaluated":[110],"capability":[114],"proposed":[117],"in":[119,148],"various":[120],"tasks,":[121],"including":[122],"visualization,":[124],"reconstruction,":[126],"face":[127],"recognition,":[128],"ZSL.":[130],"By":[131],"comparing":[132],"state-of-the-art":[134],"methods,":[137],"outstanding":[139],"results":[140],"obtained":[141],"validate":[142],"effectiveness":[144],"this":[146],"field":[150],"learning.":[153]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
