{"id":"https://openalex.org/W4372259905","doi":"https://doi.org/10.1109/icassp49357.2023.10094721","title":"End-to-End Unsupervised Sketch to Image Generation","display_name":"End-to-End Unsupervised Sketch to Image Generation","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372259905","doi":"https://doi.org/10.1109/icassp49357.2023.10094721"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10094721","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp49357.2023.10094721","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043624142","display_name":"Xingming Lv","orcid":null},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]},{"id":"https://openalex.org/I34949971","display_name":"University of Jinan","ror":"https://ror.org/02mjz6f26","country_code":"CN","type":"education","lineage":["https://openalex.org/I34949971"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xingming Lv","raw_affiliation_strings":["ShanDong University,School of Software,Jinan,China","School of Software, ShanDong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"ShanDong University,School of Software,Jinan,China","institution_ids":["https://openalex.org/I154099455","https://openalex.org/I34949971"]},{"raw_affiliation_string":"School of Software, ShanDong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101963649","display_name":"Lei Wu","orcid":"https://orcid.org/0009-0007-7363-0002"},"institutions":[{"id":"https://openalex.org/I34949971","display_name":"University of Jinan","ror":"https://ror.org/02mjz6f26","country_code":"CN","type":"education","lineage":["https://openalex.org/I34949971"]},{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Wu","raw_affiliation_strings":["ShanDong University,School of Software,Jinan,China","School of Software, ShanDong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"ShanDong University,School of Software,Jinan,China","institution_ids":["https://openalex.org/I154099455","https://openalex.org/I34949971"]},{"raw_affiliation_string":"School of Software, ShanDong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010655699","display_name":"Zhenwei Cheng","orcid":"https://orcid.org/0009-0008-6838-8634"},"institutions":[{"id":"https://openalex.org/I34949971","display_name":"University of Jinan","ror":"https://ror.org/02mjz6f26","country_code":"CN","type":"education","lineage":["https://openalex.org/I34949971"]},{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenwei Cheng","raw_affiliation_strings":["ShanDong University,School of Software,Jinan,China","School of Software, ShanDong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"ShanDong University,School of Software,Jinan,China","institution_ids":["https://openalex.org/I154099455","https://openalex.org/I34949971"]},{"raw_affiliation_string":"School of Software, ShanDong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101536417","display_name":"Xiangxu Meng","orcid":"https://orcid.org/0000-0001-7290-5659"},"institutions":[{"id":"https://openalex.org/I34949971","display_name":"University of Jinan","ror":"https://ror.org/02mjz6f26","country_code":"CN","type":"education","lineage":["https://openalex.org/I34949971"]},{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangxu Meng","raw_affiliation_strings":["ShanDong University,School of Software,Jinan,China","School of Software, ShanDong University, Jinan, China"],"affiliations":[{"raw_affiliation_string":"ShanDong University,School of Software,Jinan,China","institution_ids":["https://openalex.org/I154099455","https://openalex.org/I34949971"]},{"raw_affiliation_string":"School of Software, ShanDong University, Jinan, China","institution_ids":["https://openalex.org/I154099455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5043624142"],"corresponding_institution_ids":["https://openalex.org/I154099455","https://openalex.org/I34949971"],"apc_list":null,"apc_paid":null,"fwci":0.123,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.37217502,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"27","issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.7364903688430786},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6693261861801147},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4965277314186096},{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.4815240502357483},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4702913761138916},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.44944360852241516},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.35387423634529114},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.14138612151145935}],"concepts":[{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.7364903688430786},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6693261861801147},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4965277314186096},{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.4815240502357483},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4702913761138916},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44944360852241516},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.35387423634529114},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.14138612151145935}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10094721","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp49357.2023.10094721","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.7300000190734863,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W2026019603","https://openalex.org/W2475287302","https://openalex.org/W2884466206","https://openalex.org/W2962793481","https://openalex.org/W2963073614","https://openalex.org/W2963561004","https://openalex.org/W2963814095","https://openalex.org/W2963890275","https://openalex.org/W2965833116","https://openalex.org/W2981824749","https://openalex.org/W2997008662","https://openalex.org/W3035124078","https://openalex.org/W3106820655","https://openalex.org/W3115218903","https://openalex.org/W3175344711","https://openalex.org/W3203605797","https://openalex.org/W4213207493","https://openalex.org/W4249986286","https://openalex.org/W4294643831","https://openalex.org/W4320013936","https://openalex.org/W6713645886","https://openalex.org/W6729966448","https://openalex.org/W6752378368","https://openalex.org/W6775083062"],"related_works":["https://openalex.org/W2378994405","https://openalex.org/W2385974820","https://openalex.org/W2373478030","https://openalex.org/W2378679551","https://openalex.org/W3149739944","https://openalex.org/W2392363776","https://openalex.org/W2063051341","https://openalex.org/W2591066345","https://openalex.org/W1494563618","https://openalex.org/W2357022711"],"abstract_inverted_index":{"A":[0],"freehand":[1,19,87,183],"sketch":[2,44],"is":[3,94,103,160],"geometrically":[4],"distorted":[5,65],"and":[6,10,35,46,67,69,90,122,127,135,157,166,170],"lacks":[7],"colors,":[8,68],"textures,":[9],"other":[11],"visual":[12],"details.":[13],"This":[14],"leads":[15],"to":[16,30,74,84,104,109,178],"challenges":[17],"in":[18],"sketch-to-image":[20,88],"generation":[21],"tasks.":[22],"Many":[23],"existing":[24],"works":[25],"take":[26],"a":[27,106,145],"multistage":[28],"strategy":[29],"generate":[31,179],"images":[32,59,181],"from":[33,182],"sketches,":[34],"they":[36],"depend":[37],"on":[38,96,131,151,162],"the":[39,42,48,52,57,76,86,91,114,132,152],"shape":[40,49,70,107,111],"of":[41,51,61,138,155],"input":[43],"badly":[45],"ignore":[47],"adjustment":[50],"generated":[53,58,115],"image.":[54,116],"More":[55],"importantly,":[56],"are":[60],"low":[62],"quality":[63],"with":[64],"textures":[66],"deformation.":[71],"In":[72],"order":[73],"overcome":[75],"above":[77],"challenges,":[78],"we":[79,118,173],"propose":[80,105],"an":[81,97,139],"end-to-end":[82],"method":[83],"accomplish":[85],"task,":[89],"proposed":[92],"architecture":[93],"based":[95,150],"unsupervised":[98],"network.":[99],"Our":[100],"key":[101],"insight":[102],"discriminator":[108],"provide":[110],"constraints":[112],"for":[113],"Besides,":[117],"introduce":[119],"Image-Global":[120],"Attention(IGA)":[121],"Focal":[123],"Frequency":[124],"Loss(FFL).":[125],"IGA":[126],"FFL":[128],"mainly":[129],"focuses":[130],"whole":[133],"image":[134],"every":[136],"patch":[137],"image,":[140],"respectively.":[141],"We":[142],"also":[143],"extend":[144],"new":[146],"dataset":[147],"called":[148],"NewGiraffe":[149],"giraffe":[153],"class":[154],"SketchyCOCO,":[156],"our":[158,175],"approach":[159],"validated":[161],"two":[163],"datasets:":[164],"Shoes":[165],"NewGiraffe.":[167],"Through":[168],"qualitative":[169],"quantitative":[171],"results,":[172],"demonstrate":[174],"method\u2019s":[176],"ability":[177],"realistic":[180],"sketches.":[184]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
