{"id":"https://openalex.org/W7126261665","doi":"https://doi.org/10.1109/access.2026.3659732","title":"Vi-SketchGPT: A Novel Multi-Scale and Context-Aware Representation for Sketch Generation and Classification","display_name":"Vi-SketchGPT: A Novel Multi-Scale and Context-Aware Representation for Sketch Generation and Classification","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7126261665","doi":"https://doi.org/10.1109/access.2026.3659732"},"language":"en","primary_location":{"id":"doi:10.1109/access.2026.3659732","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3659732","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2026.3659732","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113341684","display_name":"Giulio Federico","orcid":null},"institutions":[{"id":"https://openalex.org/I122991210","display_name":"Istituto di Scienza e Tecnologie dell'Informazione \"Alessandro Faedo\"","ror":"https://ror.org/05kacka20","country_code":"IT","type":"facility","lineage":["https://openalex.org/I122991210","https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Giulio Federico","raw_affiliation_strings":["Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy","institution_ids":["https://openalex.org/I122991210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103162338","display_name":"Giuseppe Amato","orcid":null},"institutions":[{"id":"https://openalex.org/I122991210","display_name":"Istituto di Scienza e Tecnologie dell'Informazione \"Alessandro Faedo\"","ror":"https://ror.org/05kacka20","country_code":"IT","type":"facility","lineage":["https://openalex.org/I122991210","https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Giuseppe Amato","raw_affiliation_strings":["Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy","institution_ids":["https://openalex.org/I122991210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121131835","display_name":"Fabio Carrara","orcid":null},"institutions":[{"id":"https://openalex.org/I122991210","display_name":"Istituto di Scienza e Tecnologie dell'Informazione \"Alessandro Faedo\"","ror":"https://ror.org/05kacka20","country_code":"IT","type":"facility","lineage":["https://openalex.org/I122991210","https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Fabio Carrara","raw_affiliation_strings":["Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy","institution_ids":["https://openalex.org/I122991210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072879702","display_name":"Claudio Gennaro","orcid":null},"institutions":[{"id":"https://openalex.org/I122991210","display_name":"Istituto di Scienza e Tecnologie dell'Informazione \"Alessandro Faedo\"","ror":"https://ror.org/05kacka20","country_code":"IT","type":"facility","lineage":["https://openalex.org/I122991210","https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Claudio Gennaro","raw_affiliation_strings":["Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy","institution_ids":["https://openalex.org/I122991210"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052859496","display_name":"Marco Di Benedetto","orcid":null},"institutions":[{"id":"https://openalex.org/I122991210","display_name":"Istituto di Scienza e Tecnologie dell'Informazione \"Alessandro Faedo\"","ror":"https://ror.org/05kacka20","country_code":"IT","type":"facility","lineage":["https://openalex.org/I122991210","https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Di Benedetto","raw_affiliation_strings":["Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science and Technologies (ISTI-CNR), Pisa, Italy","institution_ids":["https://openalex.org/I122991210"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5113341684"],"corresponding_institution_ids":["https://openalex.org/I122991210"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3121936,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":null,"first_page":"17760","last_page":"17773"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.15690000355243683,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.15690000355243683,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11904","display_name":"Spatial Cognition and Navigation","score":0.14249999821186066,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.10270000249147415,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.7590000033378601},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.616100013256073},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5091000199317932},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.46650001406669617},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.40700000524520874},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.36899998784065247},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.33959999680519104},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.336899995803833},{"id":"https://openalex.org/keywords/intuition","display_name":"Intuition","score":0.3325999975204468}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8144999742507935},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.7590000033378601},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.616100013256073},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5982000231742859},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5091000199317932},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.46650001406669617},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.40700000524520874},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.36899998784065247},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35679998993873596},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3402000069618225},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.33959999680519104},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.3325999975204468},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2955000102519989},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2946999967098236},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28850001096725464},{"id":"https://openalex.org/C132900626","wikidata":"https://www.wikidata.org/wiki/Q7534733","display_name":"Sketch recognition","level":4,"score":0.2865999937057495},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.2743000090122223},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.26330000162124634},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.2621999979019165},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.26089999079704285},{"id":"https://openalex.org/C171018156","wikidata":"https://www.wikidata.org/wiki/Q7370306","display_name":"Rotation formalisms in three dimensions","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C161301231","wikidata":"https://www.wikidata.org/wiki/Q3478658","display_name":"Knowledge representation and reasoning","level":2,"score":0.2558000087738037},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.25529998540878296},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.2515000104904175},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/access.2026.3659732","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3659732","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:dnet:iris________::297618ff264156ae9fcfb569428ed6eb","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S7407055261","display_name":"ISTI Open Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE ACCESS","raw_type":"Journal article"},{"id":"pmh:oai:doaj.org/article:649e7b82a2c14d3bbb0fe83899809f9a","is_oa":true,"landing_page_url":"https://doaj.org/article/649e7b82a2c14d3bbb0fe83899809f9a","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 14, Pp 17760-17773 (2026)","raw_type":"article"},{"id":"pmh:oai:zenodo.org:17338722","is_oa":true,"landing_page_url":"https://doi.org/10.1109/ACCESS.2026.3659732","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, 14, 17760-17773, (2026-01-30)","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1109/access.2026.3659732","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3659732","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.44693928956985474,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1972420097","https://openalex.org/W2027125558","https://openalex.org/W2064675550","https://openalex.org/W2125635584","https://openalex.org/W2151103935","https://openalex.org/W2153404544","https://openalex.org/W2185824196","https://openalex.org/W2194775991","https://openalex.org/W2294927362","https://openalex.org/W2467281799","https://openalex.org/W2471581439","https://openalex.org/W2474425887","https://openalex.org/W2523894284","https://openalex.org/W2549858052","https://openalex.org/W2776402438","https://openalex.org/W2805097687","https://openalex.org/W2890627175","https://openalex.org/W2899102889","https://openalex.org/W2904759000","https://openalex.org/W2941405440","https://openalex.org/W2963307918","https://openalex.org/W2963446712","https://openalex.org/W2963703957","https://openalex.org/W2964036047","https://openalex.org/W2964266708","https://openalex.org/W2965072550","https://openalex.org/W2979237919","https://openalex.org/W2981922830","https://openalex.org/W3035035925","https://openalex.org/W3035058753","https://openalex.org/W3093027278","https://openalex.org/W3095075928","https://openalex.org/W3099716136","https://openalex.org/W3107824324","https://openalex.org/W3138516171","https://openalex.org/W3150584131","https://openalex.org/W3177383578","https://openalex.org/W3187403570","https://openalex.org/W4312443924","https://openalex.org/W4385245566","https://openalex.org/W4393308399","https://openalex.org/W4402343084","https://openalex.org/W4402727407","https://openalex.org/W4402754147","https://openalex.org/W4413144360"],"related_works":[],"abstract_inverted_index":{"Human":[0],"sketches":[1,35,167],"exhibit":[2],"substantial":[3],"variability":[4],"across":[5],"individuals":[6],"in":[7,191],"terms":[8],"of":[9,40,45,52,61,100,108,189],"line":[10],"style,":[11],"abstraction":[12],"level":[13],"and":[14,25,33,59,78,91,130,152,159,181],"drawing":[15],"conventions.":[16],"Unlike":[17],"realistic":[18],"images,":[19],"they":[20],"provide":[21],"limited":[22],"contextual":[23],"information":[24,190],"rely":[26],"on":[27,156],"highly":[28],"simplified":[29],"concept":[30],"representations.":[31],"Recognizing":[32],"generating":[34,172],"therefore":[36],"requires":[37],"efficient":[38],"use":[39],"the":[41,46,62,67,89,101,106,109,145,157,164,187,192],"available":[42],"information,":[43,112,124],"identification":[44],"most":[47],"informative":[48],"local":[49,84],"features,":[50,85],"interpretation":[51],"their":[53],"meaning":[54],"within":[55,88],"a":[56,76,97,134],"minimal":[57],"context,":[58],"understanding":[60,99],"spatial":[63,93],"relationships":[64],"that":[65,80,163,174],"define":[66],"overall":[68],"structure.":[69,103],"In":[70],"this":[71,121],"study,":[72],"we":[73,113],"introduce":[74],"ViSketch-GPT,":[75],"representation":[77,143],"model":[79,146,165],"can":[81],"extract":[82],"these":[83],"contextualize":[86],"them":[87],"sketch":[90,102],"encode":[92],"relationships,":[94,180],"thereby":[95],"enabling":[96],"deeper":[98],"Guided":[104],"by":[105],"intuition":[107],"void":[110],"as":[111],"leverage":[114],"Signed":[115],"Distance":[116],"Functions":[117],"(SDF)":[118],"to":[119,137,147],"reveal":[120],"potentially":[122],"hidden":[123],"organizing":[125],"it":[126,132],"via":[127],"quadtree":[128],"decomposition":[129],"processing":[131],"with":[133,168],"hierarchical":[135],"Transformer":[136],"capture":[138,182],"multi-scale":[139],"dependencies.":[140],"This":[141],"structured":[142],"allows":[144],"support":[148],"both":[149],"high-fidelity":[150],"generation":[151],"accurate":[153],"classification.":[154],"Experiments":[155],"QuickDraw":[158],"TU-Berlin":[160],"datasets":[161],"demonstrated":[162],"classifies":[166],"high":[169],"accuracy":[170],"while":[171],"outputs":[173],"preserve":[175],"structural":[176],"coherence,":[177],"respect":[178],"part":[179],"essential":[183],"conceptual":[184],"patterns":[185],"despite":[186],"scarcity":[188],"original":[193],"sketches.":[194]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-02-01T00:00:00"}
