{"id":"https://openalex.org/W7138214591","doi":"https://doi.org/10.1609/aaai.v40i6.42425","title":"A Theory-Inspired Framework for Few-Shot Cross-Modal Sketch Person Re-Identification","display_name":"A Theory-Inspired Framework for Few-Shot Cross-Modal Sketch Person Re-Identification","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138214591","doi":"https://doi.org/10.1609/aaai.v40i6.42425"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i6.42425","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i6.42425","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i6.42425","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026737465","display_name":"Yunpeng Gong","orcid":"https://orcid.org/0000-0002-6498-2555"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yunpeng Gong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129711118","display_name":"Yongjie Hou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yongjie Hou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033892804","display_name":"Jiangming Shi","orcid":"https://orcid.org/0000-0003-3817-0497"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiangming Shi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129693115","display_name":"Kim Long Diep","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim Long Diep","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129735286","display_name":"Min Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Min Jiang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5026737465"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.54213274,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"6","first_page":"4284","last_page":"4292"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.5942000150680542,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.5942000150680542,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.19269999861717224,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.11190000176429749,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.8948000073432922},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6276000142097473},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5016000270843506},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.43650001287460327},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.4309000074863434},{"id":"https://openalex.org/keywords/perturbation","display_name":"Perturbation (astronomy)","score":0.35659998655319214},{"id":"https://openalex.org/keywords/sketch-recognition","display_name":"Sketch recognition","score":0.32589998841285706}],"concepts":[{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.8948000073432922},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6876000165939331},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6276000142097473},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6068999767303467},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5016000270843506},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4424999952316284},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.43650001287460327},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.4309000074863434},{"id":"https://openalex.org/C177918212","wikidata":"https://www.wikidata.org/wiki/Q803623","display_name":"Perturbation (astronomy)","level":2,"score":0.35659998655319214},{"id":"https://openalex.org/C132900626","wikidata":"https://www.wikidata.org/wiki/Q7534733","display_name":"Sketch recognition","level":4,"score":0.32589998841285706},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3158000111579895},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.3140000104904175},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2973000109195709},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.29660001397132874},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.2824000120162964},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2711000144481659},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.262800008058548},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2538999915122986},{"id":"https://openalex.org/C2776960227","wikidata":"https://www.wikidata.org/wiki/Q2586354","display_name":"Knowledge transfer","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i6.42425","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i6.42425","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i6.42425","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i6.42425","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Sketch-based":[0],"person":[1],"re-identification":[2],"aims":[3],"to":[4,16,70,85,128],"match":[5],"hand-drawn":[6],"sketches":[7],"with":[8],"RGB":[9,126],"surveillance":[10],"images,":[11],"but":[12],"remains":[13],"challenging":[14],"due":[15],"severe":[17],"modality":[18,71,106],"gaps":[19],"and":[20,59,62,89,93,108],"limited":[21],"labeled":[22],"data.":[23],"To":[24],"address":[25],"this,":[26],"we":[27,42,74],"propose":[28],"KTCAA,":[29],"a":[30,117],"theoretically":[31],"inspired":[32],"framework":[33],"for":[34],"few-shot":[35],"cross-modal":[36],"generalization.":[37],"Drawing":[38],"on":[39,132],"generalization":[40],"bounds,":[41],"identify":[43],"two":[44],"key":[45],"factors":[46],"affecting":[47],"target":[48,60,87],"risk:":[49],"(1)":[50,76],"domain":[51],"discrepancy,":[52],"reflecting":[53],"the":[54,67],"alignment":[55,122],"difficulty":[56],"between":[57],"source":[58],"distributions;":[61],"(2)":[63,94],"perturbation":[64,101],"invariance,":[65],"measuring":[66],"model\u2019s":[68],"robustness":[69],"shifts.":[72],"Accordingly,":[73],"design:":[75],"Alignment":[77],"Augmentation":[78],"(AA),":[79],"which":[80,99],"applies":[81],"localized":[82],"sketch-style":[83],"transformations":[84],"simulate":[86],"distributions":[88],"guide":[90],"progressive":[91],"alignment;":[92],"Knowledge":[95],"Transfer":[96],"Catalyst":[97],"(KTC),":[98],"enhances":[100],"invariance":[102],"by":[103],"introducing":[104],"worst-case":[105],"perturbations":[107],"enforcing":[109],"consistency.":[110],"These":[111],"modules":[112],"are":[113],"jointly":[114],"optimized":[115],"within":[116],"meta-learning":[118],"paradigm":[119],"that":[120,136],"transfers":[121],"knowledge":[123],"from":[124],"data-abundant":[125],"domains":[127],"sketch":[129],"scenarios.":[130],"Experiments":[131],"multiple":[133],"benchmarks":[134],"show":[135],"KTCAA":[137],"achieves":[138],"state-of-the-art":[139],"performance,":[140],"particularly":[141],"under":[142],"data-scarce":[143],"conditions.":[144]},"counts_by_year":[],"updated_date":"2026-03-18T06:31:55.123368","created_date":"2026-03-18T00:00:00"}
