{"id":"https://openalex.org/W4414491631","doi":"https://doi.org/10.1109/tvcg.2025.3613388","title":"SketchRefiner: Text-Guided Sketch Refinement Through Latent Diffusion Models","display_name":"SketchRefiner: Text-Guided Sketch Refinement Through Latent Diffusion Models","publication_year":2025,"publication_date":"2025-09-23","ids":{"openalex":"https://openalex.org/W4414491631","doi":"https://doi.org/10.1109/tvcg.2025.3613388","pmid":"https://pubmed.ncbi.nlm.nih.gov/40986574"},"language":"en","primary_location":{"id":"doi:10.1109/tvcg.2025.3613388","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2025.3613388","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032861309","display_name":"Yingjie Tian","orcid":"https://orcid.org/0000-0002-4675-0398"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yingjie Tian","raw_affiliation_strings":["School of Economics and Management, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Economics and Management, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100721945","display_name":"Minghao Liu","orcid":"https://orcid.org/0000-0002-3996-9965"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minghao Liu","raw_affiliation_strings":["School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101694702","display_name":"Haoran Jiang","orcid":"https://orcid.org/0000-0002-1533-1887"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoran Jiang","raw_affiliation_strings":["School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021557044","display_name":"Yunbin Tu","orcid":"https://orcid.org/0000-0002-9525-9060"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunbin Tu","raw_affiliation_strings":["School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087092119","display_name":"Duo Su","orcid":"https://orcid.org/0000-0002-9607-3639"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Duo Su","raw_affiliation_strings":["School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5032861309"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27500906,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"31","issue":"12","first_page":"10711","last_page":"10722"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.967199981212616,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.5920000076293945},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.5205000042915344},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5116999745368958},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.35280001163482666},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.32109999656677246},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.29840001463890076},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.2806999981403351}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8712999820709229},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.5920000076293945},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.5205000042915344},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5116999745368958},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5013999938964844},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.32109999656677246},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30230000615119934},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.29840001463890076},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.2784999907016754},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.2671999931335449},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2653000056743622},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.26269999146461487},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.26159998774528503},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.25769999623298645},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.25110000371932983},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2508000135421753}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tvcg.2025.3613388","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2025.3613388","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},{"id":"pmid:40986574","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40986574","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on visualization and computer graphics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W2018685757","https://openalex.org/W2081225124","https://openalex.org/W2175498352","https://openalex.org/W2186546225","https://openalex.org/W2280900767","https://openalex.org/W2289102159","https://openalex.org/W2466618734","https://openalex.org/W2474143829","https://openalex.org/W2501192503","https://openalex.org/W2604662340","https://openalex.org/W2811499654","https://openalex.org/W2883718552","https://openalex.org/W2939230787","https://openalex.org/W2954251965","https://openalex.org/W2962785568","https://openalex.org/W2963636051","https://openalex.org/W3000955797","https://openalex.org/W3032364478","https://openalex.org/W3087797123","https://openalex.org/W3093027278","https://openalex.org/W3107232127","https://openalex.org/W3107593830","https://openalex.org/W3126753585","https://openalex.org/W3157971972","https://openalex.org/W3164412074","https://openalex.org/W4210867585","https://openalex.org/W4213207493","https://openalex.org/W4223918756","https://openalex.org/W4243239098","https://openalex.org/W4285604311","https://openalex.org/W4286611322","https://openalex.org/W4312353784","https://openalex.org/W4312457448","https://openalex.org/W4312915164","https://openalex.org/W4312933868","https://openalex.org/W4319301041","https://openalex.org/W4323892234","https://openalex.org/W4372260515","https://openalex.org/W4382466406","https://openalex.org/W4385271048","https://openalex.org/W4385537492","https://openalex.org/W4386072256","https://openalex.org/W4386076001","https://openalex.org/W4386590352","https://openalex.org/W4388191573","https://openalex.org/W4390204464","https://openalex.org/W4390872497","https://openalex.org/W4390873054","https://openalex.org/W4390873553","https://openalex.org/W4400820794","https://openalex.org/W4401414530","https://openalex.org/W4402727607","https://openalex.org/W4403021266","https://openalex.org/W4403333950","https://openalex.org/W4404195452"],"related_works":[],"abstract_inverted_index":{"Free-hand":[0],"sketches":[1,15,22,56,73,120,170],"serve":[2],"as":[3],"efficient":[4],"tools":[5],"for":[6,18],"creativity":[7],"and":[8,35,112,126,166,178],"communication,":[9],"yet":[10],"expressing":[11],"ideas":[12,34],"clearly":[13],"through":[14,23],"remains":[16,57],"challenging":[17],"untrained":[19],"individuals.":[20],"Optimizing":[21],"text":[24,82,124,153,176],"guidance":[25],"can":[26,163],"enhance":[27],"individuals'":[28],"ability":[29],"to":[30,70,92,118,138],"effectively":[31],"convey":[32],"their":[33],"improve":[36,139],"overall":[37],"communication":[38],"efficiency.":[39],"While":[40],"recent":[41],"advancements":[42],"in":[43,97],"Artificial":[44],"Intelligence":[45],"Generated":[46],"Content":[47],"(AIGC)":[48],"have":[49],"been":[50],"notable,":[51],"research":[52],"on":[53],"optimizing":[54,98],"free-hand":[55,127],"relatively":[58],"unexplored.":[59],"In":[60],"this":[61],"paper,":[62],"we":[63,130,158],"introduce":[64,113],"SketchRefiner,":[65],"an":[66],"innovative":[67],"method":[68,162],"designed":[69],"refine":[71],"rough":[72],"from":[74],"various":[75],"categories":[76],"into":[77],"polished":[78],"versions":[79],"guided":[80],"by":[81],"prompts.":[83],"SketchRefiner":[84,146],"utilizes":[85],"a":[86,94,99,114,132],"latent":[87],"diffusion":[88],"model":[89],"with":[90,122,149,174],"ControlNet":[91],"guide":[93],"differentiable":[95],"rasterizer":[96],"set":[100],"of":[101,142],"B\u00e9zier":[102],"curves.":[103],"We":[104],"extend":[105],"the":[106,140],"score":[107],"distillation":[108],"sampling":[109],"(SDS)":[110],"loss":[111,117],"joint":[115],"semantic":[116],"encourage":[119],"aligned":[121],"given":[123],"prompts":[125,177],"sketches.":[128,144,179],"Additionally,":[129],"propose":[131],"fusion":[133],"attention-map":[134],"stroke":[135],"initialization":[136],"strategy":[137],"quality":[141],"refined":[143,169],"Furthermore,":[145],"provides":[147],"users":[148],"fine-grained":[150],"control":[151],"over":[152],"guidance.":[154],"Through":[155],"extensive":[156],"experiments,":[157],"demonstrate":[159],"that":[160,171],"our":[161],"generate":[164],"accurate":[165],"aesthetically":[167],"pleasing":[168],"closely":[172],"align":[173],"input":[175]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
