{"id":"https://openalex.org/W4404520905","doi":"https://doi.org/10.1109/tvcg.2024.3502395","title":"MixSA: Training-Free Reference-Based Sketch Extraction via Mixture-of-Self-Attention","display_name":"MixSA: Training-Free Reference-Based Sketch Extraction via Mixture-of-Self-Attention","publication_year":2024,"publication_date":"2024-11-19","ids":{"openalex":"https://openalex.org/W4404520905","doi":"https://doi.org/10.1109/tvcg.2024.3502395","pmid":"https://pubmed.ncbi.nlm.nih.gov/40030381"},"language":"en","primary_location":{"id":"doi:10.1109/tvcg.2024.3502395","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2024.3502395","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.00816","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113365120","display_name":"Rui Yang","orcid":"https://orcid.org/0000-0002-1996-2993"},"institutions":[{"id":"https://openalex.org/I88830068","display_name":"Shaanxi Normal University","ror":"https://ror.org/0170z8493","country_code":"CN","type":"education","lineage":["https://openalex.org/I88830068"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Rui Yang","raw_affiliation_strings":["School of Computer Sciences, Shaanxi Normal University, Xi&#x2019;an, China","School of Computer Sciences, Shaanxi Normal University, Xi&#x0027;an, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Sciences, Shaanxi Normal University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I88830068"]},{"raw_affiliation_string":"School of Computer Sciences, Shaanxi Normal University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I88830068"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xiaojun Wu","orcid":"https://orcid.org/0000-0002-7779-553X"},"institutions":[{"id":"https://openalex.org/I88830068","display_name":"Shaanxi Normal University","ror":"https://ror.org/0170z8493","country_code":"CN","type":"education","lineage":["https://openalex.org/I88830068"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojun Wu","raw_affiliation_strings":["School of Computer Science and the Key Laboratory of Intelligent Computing and Service Technology for Folk Song of the Ministry of Culture and Tourism, Shaanxi Normal University, Xi&#x2019;an, China","School of Computer Science and the Key Laboratory of Intelligent Computing and Service Technology for Folk Song of the Ministry of Culture and Tourism, Shaanxi Normal University, Xi&#x0027;an, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and the Key Laboratory of Intelligent Computing and Service Technology for Folk Song of the Ministry of Culture and Tourism, Shaanxi Normal University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I88830068"]},{"raw_affiliation_string":"School of Computer Science and the Key Laboratory of Intelligent Computing and Service Technology for Folk Song of the Ministry of Culture and Tourism, Shaanxi Normal University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I88830068"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056103024","display_name":"Shengfeng He","orcid":"https://orcid.org/0000-0002-3802-4644"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shengfeng He","raw_affiliation_strings":["School of Computing and Information Systems, Singapore Management University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computing and Information Systems, Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5113365120"],"corresponding_institution_ids":["https://openalex.org/I88830068"],"apc_list":null,"apc_paid":null,"fwci":1.2401,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.88743693,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"31","issue":"9","first_page":"6208","last_page":"6222"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9799000024795532,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.9090568423271179},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8588947057723999},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5989629030227661},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.5236920118331909},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.4733163118362427},{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.45034146308898926},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43280279636383057},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.42019107937812805},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3786684274673462},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.26118940114974976},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.14344531297683716},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08313283324241638}],"concepts":[{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.9090568423271179},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8588947057723999},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5989629030227661},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.5236920118331909},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.4733163118362427},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.45034146308898926},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43280279636383057},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.42019107937812805},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3786684274673462},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.26118940114974976},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.14344531297683716},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08313283324241638},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/tvcg.2024.3502395","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2024.3502395","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},{"id":"pmid:40030381","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40030381","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on visualization and computer graphics","raw_type":null},{"id":"pmh:oai:arXiv.org:2501.00816","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.00816","pdf_url":"https://arxiv.org/pdf/2501.00816","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:ink.library.smu.edu.sg:sis_research-11535","is_oa":true,"landing_page_url":"https://ink.library.smu.edu.sg/sis_research/10533","pdf_url":null,"source":{"id":"https://openalex.org/S4306401925","display_name":"Singapore Management University Institutional Knowledge (InK) (Singapore Management University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79891267","host_organization_name":"Singapore Management University","host_organization_lineage":["https://openalex.org/I79891267"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://doi.org/10.1109/TVCG.2024.3502395","raw_type":"Journal Article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.00816","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.00816","pdf_url":"https://arxiv.org/pdf/2501.00816","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6642458801","display_name":null,"funder_award_id":"11872036","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8916415075","display_name":null,"funder_award_id":"62377034","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W845365781","https://openalex.org/W1901129140","https://openalex.org/W1993935870","https://openalex.org/W2109854212","https://openalex.org/W2133665775","https://openalex.org/W2145023731","https://openalex.org/W2412782625","https://openalex.org/W2475287302","https://openalex.org/W2603777577","https://openalex.org/W2800409282","https://openalex.org/W2891833067","https://openalex.org/W2914578055","https://openalex.org/W2946220758","https://openalex.org/W2953881420","https://openalex.org/W2957909335","https://openalex.org/W2962785568","https://openalex.org/W2963185411","https://openalex.org/W2963890275","https://openalex.org/W2972003492","https://openalex.org/W3025800305","https://openalex.org/W3034826836","https://openalex.org/W3203398299","https://openalex.org/W4213207493","https://openalex.org/W4285414583","https://openalex.org/W4286611322","https://openalex.org/W4311804474","https://openalex.org/W4312353784","https://openalex.org/W4312933868","https://openalex.org/W4319300559","https://openalex.org/W4381334907","https://openalex.org/W4385245566","https://openalex.org/W4385276764","https://openalex.org/W4386065733","https://openalex.org/W4386071613","https://openalex.org/W4386076532","https://openalex.org/W4388692607","https://openalex.org/W4390190098","https://openalex.org/W4390871782","https://openalex.org/W4390871856","https://openalex.org/W4390872497","https://openalex.org/W4390874265","https://openalex.org/W4390874393","https://openalex.org/W4400582187","https://openalex.org/W4402667886","https://openalex.org/W4402715897","https://openalex.org/W4402716004","https://openalex.org/W6780043386","https://openalex.org/W6783713337","https://openalex.org/W6855771293","https://openalex.org/W6862213106","https://openalex.org/W6863631979","https://openalex.org/W7036952098"],"related_works":["https://openalex.org/W2378994405","https://openalex.org/W2385974820","https://openalex.org/W2373478030","https://openalex.org/W2378679551","https://openalex.org/W3149739944","https://openalex.org/W2392363776","https://openalex.org/W2063051341","https://openalex.org/W2591066345","https://openalex.org/W1494563618","https://openalex.org/W2357022711"],"abstract_inverted_index":{"Current":[0],"sketch":[1,30,40,136],"extraction":[2,31],"methods":[3,150],"either":[4],"require":[5],"extensive":[6],"training":[7],"or":[8],"fail":[9],"to":[10,89,155],"capture":[11],"a":[12,28,47,164],"wide":[13,165],"range":[14,166],"of":[15,71,103,119,148,167],"artistic":[16,168],"styles,":[17],"limiting":[18],"their":[19],"practical":[20],"applicability":[21],"and":[22,58,84,101,139],"versatility.":[23],"We":[24],"introduce":[25],"Mixture-of-Self-Attention":[26],"(MixSA),":[27],"training-free":[29],"method":[32],"that":[33,160],"leverages":[34],"strong":[35],"diffusion":[36],"priors":[37],"for":[38,67],"enhanced":[39],"perception.":[41],"At":[42],"its":[43],"core,":[44],"MixSA":[45,114,131],"employs":[46],"mixture-of-self-attention":[48],"technique,":[49],"which":[50],"manipulates":[51],"self-attention":[52],"layers":[53,110],"by":[54,122],"substituting":[55],"the":[56,68,99,116,146],"keys":[57],"values":[59],"with":[60,98,127],"those":[61],"from":[62],"reference":[63],"sketches.":[64],"This":[65,141],"allows":[66],"seamless":[69],"integration":[70],"brushstroke":[72,96],"elements":[73],"into":[74],"initial":[75,124],"outline":[76],"images,":[77,105],"offering":[78],"precise":[79],"control":[80],"over":[81],"texture":[82,100],"density":[83],"enabling":[85],"interpolation":[86],"between":[87],"styles":[88,97],"create":[90],"novel,":[91],"unseen":[92],"styles.":[93],"By":[94],"aligning":[95],"contours":[102],"colored":[104],"particularly":[106],"in":[107,135],"late":[108],"decoder":[109],"handling":[111],"local":[112],"textures,":[113],"addresses":[115],"common":[117],"issue":[118],"color":[120],"averaging":[121],"adjusting":[123],"outlines.":[125],"Evaluated":[126],"various":[128],"perceptual":[129],"metrics,":[130],"demonstrates":[132],"superior":[133],"performance":[134],"quality,":[137],"flexibility,":[138],"applicability.":[140],"approach":[142],"not":[143],"only":[144],"overcomes":[145],"limitations":[147],"existing":[149],"but":[151],"also":[152],"empowers":[153],"users":[154],"generate":[156],"diverse,":[157],"high-fidelity":[158],"sketches":[159],"more":[161],"accurately":[162],"reflect":[163],"expressions.":[169]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
