{"id":"https://openalex.org/W4399794198","doi":"https://doi.org/10.48550/arxiv.2406.10429","title":"Consistency-diversity-realism Pareto fronts of conditional image generative models","display_name":"Consistency-diversity-realism Pareto fronts of conditional image generative models","publication_year":2024,"publication_date":"2024-06-14","ids":{"openalex":"https://openalex.org/W4399794198","doi":"https://doi.org/10.48550/arxiv.2406.10429"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2406.10429","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.10429","pdf_url":"https://arxiv.org/pdf/2406.10429","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.10429","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049825997","display_name":"Pietro Astolfi","orcid":"https://orcid.org/0000-0002-5192-9608"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Astolfi, Pietro","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045602407","display_name":"Marl\u00e8ne Careil","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Careil, Marlene","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102935600","display_name":"Melissa Hall","orcid":"https://orcid.org/0009-0009-0509-1654"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hall, Melissa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010595613","display_name":"Oscar Ma\u00f1as","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma\u00f1as, Oscar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029739727","display_name":"Matthew J. Muckley","orcid":"https://orcid.org/0000-0002-6525-8817"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muckley, Matthew","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040312210","display_name":"Jakob Verbeek","orcid":"https://orcid.org/0000-0003-1419-1816"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Verbeek, Jakob","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080039924","display_name":"Adriana Romero","orcid":"https://orcid.org/0000-0003-3604-6281"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Soriano, Adriana Romero","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5024536150","display_name":"Michal Drozdzal","orcid":"https://orcid.org/0000-0002-0661-6338"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Drozdzal, Michal","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5049825997"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10778","display_name":"Philosophy and History of Science","score":0.22089999914169312,"subfield":{"id":"https://openalex.org/subfields/1207","display_name":"History and Philosophy of Science"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10778","display_name":"Philosophy and History of Science","score":0.22089999914169312,"subfield":{"id":"https://openalex.org/subfields/1207","display_name":"History and Philosophy of Science"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.7955604195594788},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.687303364276886},{"id":"https://openalex.org/keywords/pareto-principle","display_name":"Pareto principle","score":0.6478419303894043},{"id":"https://openalex.org/keywords/diversity","display_name":"Diversity (politics)","score":0.5927121639251709},{"id":"https://openalex.org/keywords/realism","display_name":"Realism","score":0.5530539155006409},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4298310875892639},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4062448740005493},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.4029596149921417},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.39733949303627014},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36048072576522827},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.32809728384017944},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.3204529881477356},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.3060360848903656},{"id":"https://openalex.org/keywords/epistemology","display_name":"Epistemology","score":0.21579766273498535},{"id":"https://openalex.org/keywords/sociology","display_name":"Sociology","score":0.19957947731018066},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.18327492475509644}],"concepts":[{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.7955604195594788},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.687303364276886},{"id":"https://openalex.org/C137635306","wikidata":"https://www.wikidata.org/wiki/Q182667","display_name":"Pareto principle","level":2,"score":0.6478419303894043},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.5927121639251709},{"id":"https://openalex.org/C543847140","wikidata":"https://www.wikidata.org/wiki/Q2642826","display_name":"Realism","level":2,"score":0.5530539155006409},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4298310875892639},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4062448740005493},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.4029596149921417},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39733949303627014},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36048072576522827},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.32809728384017944},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.3204529881477356},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.3060360848903656},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.21579766273498535},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.19957947731018066},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.18327492475509644},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2406.10429","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.10429","pdf_url":"https://arxiv.org/pdf/2406.10429","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2406.10429","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2406.10429","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2406.10429","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.10429","pdf_url":"https://arxiv.org/pdf/2406.10429","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2380075625","https://openalex.org/W2387507339","https://openalex.org/W4390718435","https://openalex.org/W4390549206","https://openalex.org/W3137171911","https://openalex.org/W4379540039","https://openalex.org/W4237784285","https://openalex.org/W2374712251","https://openalex.org/W4206705773","https://openalex.org/W1603736412"],"abstract_inverted_index":{"Building":[0],"world":[1,10,27,35,264],"models":[2,19,31,59,81,109,158,171,198,206],"that":[3,65,79,90,118,129,156,191,226],"accurately":[4],"and":[5,45,75,98,107,110,131,146,164,168,212,232],"comprehensively":[6],"represent":[7],"the":[8,12,92,178,192,233,241,249],"real":[9],"is":[11,228],"utmost":[13],"aspiration":[14],"for":[15],"conditional":[16],"image":[17,43,73],"generative":[18,58,80],"as":[20,26,256],"it":[21],"would":[22],"enable":[23],"their":[24,111],"use":[25,104],"simulators.":[28],"For":[29],"these":[30],"to":[32,113,200,252,260],"be":[33,135,238],"successful":[34],"models,":[36],"they":[37],"should":[38,237],"not":[39],"only":[40],"excel":[41,172],"at":[42,150,161],"quality":[44,74],"prompt-image":[46],"consistency":[47,132],"but":[48],"also":[49],"ensure":[50],"high":[51],"representation":[52,162,179],"diversity.":[53,99,147,180],"However,":[54],"current":[55],"research":[56,250],"in":[57,166,173,207],"mostly":[60],"focuses":[61],"on":[62,123,185],"creative":[63],"applications":[64],"are":[66,159],"predominantly":[67],"concerned":[68],"with":[69],"human":[70],"preferences":[71],"of":[72,94,195,210,235],"aesthetics.":[76],"We":[77],"note":[78,155],"have":[82],"inference":[83],"time":[84],"mechanisms":[85],"-":[86,89],"or":[87],"knobs":[88,112],"allow":[91],"control":[93],"generation":[95],"consistency,":[96],"quality,":[97],"In":[100],"this":[101,245],"paper,":[102],"we":[103,154,189,247],"state-of-the-art":[105],"text-to-image":[106],"image-and-text-to-image":[108],"draw":[114],"consistency-diversity-realism":[115,124,216],"Pareto":[116,151,183,254],"fronts":[117,184,255],"provide":[119],"a":[120,141,186],"holistic":[121],"view":[122],"multi-objective.":[125],"Our":[126],"experiments":[127],"suggest":[128],"realism":[130],"can":[133],"both":[134],"improved":[136],"simultaneously;":[137],"however":[138],"there":[139,213,227],"exists":[140],"clear":[142],"tradeoff":[143],"between":[144,218],"realism/consistency":[145],"By":[148,181],"looking":[149],"optimal":[152],"points,":[153],"earlier":[157],"better":[160,202],"diversity":[163],"worse":[165],"consistency/realism,":[167],"more":[169,204],"recent":[170,205],"consistency/realism":[174],"while":[175],"decreasing":[176],"significantly":[177],"computing":[182],"geodiverse":[187],"dataset,":[188],"find":[190],"first":[193],"version":[194],"latent":[196],"diffusion":[197],"tends":[199],"perform":[201],"than":[203],"all":[208],"axes":[209],"evaluation,":[211],"exist":[214],"pronounced":[215],"disparities":[217],"geographical":[219],"regions.":[220],"Overall,":[221],"our":[222],"analysis":[223],"clearly":[224],"shows":[225],"no":[229],"best":[230],"model":[231,236],"choice":[234],"determined":[239],"by":[240],"downstream":[242],"application.":[243],"With":[244],"analysis,":[246],"invite":[248],"community":[251],"consider":[253],"an":[257],"analytical":[258],"tool":[259],"measure":[261],"progress":[262],"towards":[263],"models.":[265]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
