{"id":"https://openalex.org/W4366734343","doi":"https://doi.org/10.1145/3591106.3592262","title":"Not Only Generative Art: Stable Diffusion for Content-Style Disentanglement in Art Analysis","display_name":"Not Only Generative Art: Stable Diffusion for Content-Style Disentanglement in Art Analysis","publication_year":2023,"publication_date":"2023-06-08","ids":{"openalex":"https://openalex.org/W4366734343","doi":"https://doi.org/10.1145/3591106.3592262"},"language":"en","primary_location":{"id":"doi:10.1145/3591106.3592262","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3591106.3592262","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592262","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 ACM International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592262","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024109802","display_name":"Yankun Wu","orcid":"https://orcid.org/0009-0005-7175-8307"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"The University of Osaka","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yankun Wu","raw_affiliation_strings":["Osaka University, Japan"],"raw_orcid":"https://orcid.org/0009-0005-7175-8307","affiliations":[{"raw_affiliation_string":"Osaka University, Japan","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065649079","display_name":"Yuta Nakashima","orcid":"https://orcid.org/0000-0001-8000-3567"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"The University of Osaka","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuta Nakashima","raw_affiliation_strings":["Osaka University, Japan"],"raw_orcid":"https://orcid.org/0000-0001-8000-3567","affiliations":[{"raw_affiliation_string":"Osaka University, Japan","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028370193","display_name":"Noa Garc\u00eda","orcid":"https://orcid.org/0000-0002-9200-6359"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"The University of Osaka","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Noa Garcia","raw_affiliation_strings":["Osaka University, Japan"],"raw_orcid":"https://orcid.org/0000-0002-9200-6359","affiliations":[{"raw_affiliation_string":"Osaka University, Japan","institution_ids":["https://openalex.org/I98285908"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5024109802"],"corresponding_institution_ids":["https://openalex.org/I98285908"],"apc_list":null,"apc_paid":null,"fwci":2.9437,"has_fulltext":true,"cited_by_count":25,"citation_normalized_percentile":{"value":0.92778836,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"199","last_page":"208"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12650","display_name":"Aesthetic Perception and Analysis","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.7558631896972656},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6797112226486206},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6730151772499084},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.6471678018569946},{"id":"https://openalex.org/keywords/content","display_name":"Content (measure theory)","score":0.5113710761070251},{"id":"https://openalex.org/keywords/painting","display_name":"Painting","score":0.5067458748817444},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.44564616680145264},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44422686100006104},{"id":"https://openalex.org/keywords/abstract-art","display_name":"Abstract art","score":0.4314594864845276},{"id":"https://openalex.org/keywords/visual-arts","display_name":"Visual arts","score":0.18714559078216553},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.1844194233417511},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14062023162841797}],"concepts":[{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.7558631896972656},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6797112226486206},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6730151772499084},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.6471678018569946},{"id":"https://openalex.org/C2778152352","wikidata":"https://www.wikidata.org/wiki/Q5165061","display_name":"Content (measure theory)","level":2,"score":0.5113710761070251},{"id":"https://openalex.org/C205783811","wikidata":"https://www.wikidata.org/wiki/Q11629","display_name":"Painting","level":2,"score":0.5067458748817444},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.44564616680145264},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44422686100006104},{"id":"https://openalex.org/C4320435","wikidata":"https://www.wikidata.org/wiki/Q128115","display_name":"Abstract art","level":3,"score":0.4314594864845276},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.18714559078216553},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.1844194233417511},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14062023162841797},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3591106.3592262","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3591106.3592262","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592262","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 ACM International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2304.10278","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2304.10278","pdf_url":"https://arxiv.org/pdf/2304.10278","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3591106.3592262","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3591106.3592262","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592262","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 ACM International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.6600000262260437}],"awards":[{"id":"https://openalex.org/G3480760793","display_name":"Understanding Concrete and Abstract Representations in Art","funder_award_id":"20K19822","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5453712999","display_name":"Bias Mitigation for Deep Neural Networks by Concept-based Image Descriptors","funder_award_id":"23H00497","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4366734343.pdf","grobid_xml":"https://content.openalex.org/works/W4366734343.grobid-xml"},"referenced_works_count":45,"referenced_works":["https://openalex.org/W1793977698","https://openalex.org/W2011615896","https://openalex.org/W2096733369","https://openalex.org/W2161753062","https://openalex.org/W2166242527","https://openalex.org/W2475287302","https://openalex.org/W2603777577","https://openalex.org/W2737047298","https://openalex.org/W2741951152","https://openalex.org/W2766086266","https://openalex.org/W2781305742","https://openalex.org/W2897923591","https://openalex.org/W2901791883","https://openalex.org/W2927066960","https://openalex.org/W2937703861","https://openalex.org/W2962837952","https://openalex.org/W2962883796","https://openalex.org/W2963295540","https://openalex.org/W2963370915","https://openalex.org/W2963890275","https://openalex.org/W2965570799","https://openalex.org/W2981431462","https://openalex.org/W2986779468","https://openalex.org/W2994639901","https://openalex.org/W3093370337","https://openalex.org/W3101540864","https://openalex.org/W3139419286","https://openalex.org/W3141117710","https://openalex.org/W3159481202","https://openalex.org/W3165647589","https://openalex.org/W3171007011","https://openalex.org/W3171101525","https://openalex.org/W3176292403","https://openalex.org/W3204331734","https://openalex.org/W3204522981","https://openalex.org/W3216156094","https://openalex.org/W4281485151","https://openalex.org/W4306820534","https://openalex.org/W4312234230","https://openalex.org/W4312438583","https://openalex.org/W4312677692","https://openalex.org/W4312818263","https://openalex.org/W4312933868","https://openalex.org/W4312977351","https://openalex.org/W4362641980"],"related_works":["https://openalex.org/W2347808479","https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4287117424","https://openalex.org/W4387506531","https://openalex.org/W4238433571","https://openalex.org/W2967848559","https://openalex.org/W4299831724"],"abstract_inverted_index":{"The":[0,50],"duality":[1,42],"of":[2,11,31,53,108,120,155,159,169],"content":[3,21,95,141],"and":[4,26,33,55,73,96,116,142],"style":[5,34,61],"is":[6,39,57,92],"inherent":[7],"to":[8,23,35,79,93,103,139,163],"the":[9,24,29,36,60,65,117,130,156,166],"nature":[10],"art.":[12],"For":[13],"humans,":[14],"these":[15],"two":[16,167],"elements":[17,168],"are":[18],"clearly":[19],"different:":[20],"refers":[22],"objects":[25,54],"concepts":[27,56,115],"in":[28,112,134],"piece":[30],"art,":[32],"way":[37],"it":[38],"expressed.":[40],"This":[41],"poses":[43],"an":[44],"important":[45],"challenge":[46],"for":[47,89],"computer":[48],"vision.":[49],"visual":[51,118],"appearance":[52,119],"modulated":[58],"by":[59],"that":[62,128,146],"may":[63],"reflect":[64],"author\u2019s":[66],"emotions,":[67],"social":[68],"trends,":[69],"artistic":[70,131],"movement,":[71],"etc.,":[72],"their":[74],"deep":[75],"comprehension":[76],"undoubtfully":[77],"requires":[78],"handle":[80],"both.":[81],"A":[82],"promising":[83],"step":[84],"towards":[85],"a":[86,105,126,135,153],"general":[87],"paradigm":[88],"art":[90,170],"analysis":[91],"disentangle":[94,140],"style,":[97],"whereas":[98],"relying":[99],"on":[100],"human":[101],"annotations":[102],"cull":[104],"single":[106],"aspect":[107],"artworks":[109],"has":[110],"limitations":[111],"learning":[113],"semantic":[114],"paintings.":[121],"We":[122],"thus":[123],"present":[124],"GOYA,":[125],"method":[127],"distills":[129],"knowledge":[132],"captured":[133],"recent":[136],"generative":[137],"model":[138],"style.":[143],"Experiments":[144],"show":[145],"synthetically":[147],"generated":[148],"images":[149],"sufficiently":[150],"serve":[151],"as":[152],"proxy":[154],"real":[157],"distribution":[158],"artworks,":[160],"allowing":[161],"GOYA":[162],"separately":[164],"represent":[165],"while":[171],"keeping":[172],"more":[173],"information":[174],"than":[175],"existing":[176],"methods.":[177]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2023-04-24T00:00:00"}
