{"id":"https://openalex.org/W4386437562","doi":"https://doi.org/10.1145/3607828.3617796","title":"Diffusion Model with Clustering-based Conditioning for Food Image Generation","display_name":"Diffusion Model with Clustering-based Conditioning for Food Image Generation","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4386437562","doi":"https://doi.org/10.1145/3607828.3617796"},"language":"en","primary_location":{"id":"doi:10.1145/3607828.3617796","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3607828.3617796","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607828.3617796","source":null,"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th International Workshop on Multimedia Assisted Dietary Management","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3607828.3617796","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083913830","display_name":"Yue Han","orcid":"https://orcid.org/0000-0003-4494-5455"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yue Han","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063620170","display_name":"Jiangpeng He","orcid":"https://orcid.org/0000-0002-8552-9880"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiangpeng He","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020169677","display_name":"Mridul Gupta","orcid":"https://orcid.org/0000-0001-6181-1403"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mridul Gupta","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089688702","display_name":"Edward J. Delp","orcid":"https://orcid.org/0000-0002-2909-7323"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Edward J. Delp","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001380619","display_name":"Fengqing Zhu","orcid":"https://orcid.org/0000-0002-3863-3220"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fengqing Zhu","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5083913830"],"corresponding_institution_ids":["https://openalex.org/I219193219"],"apc_list":null,"apc_paid":null,"fwci":3.8088,"has_fulltext":true,"cited_by_count":13,"citation_normalized_percentile":{"value":0.93505087,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"61","last_page":"69"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10866","display_name":"Nutritional Studies and Diet","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10866","display_name":"Nutritional Studies and Diet","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9605000019073486,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11925","display_name":"Culinary Culture and Tourism","score":0.9244999885559082,"subfield":{"id":"https://openalex.org/subfields/1106","display_name":"Food Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7506018877029419},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6872912645339966},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5184444785118103},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.516939103603363},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5064798593521118},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4787306487560272},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4272370934486389},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3867374360561371},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.3444865345954895}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7506018877029419},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6872912645339966},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5184444785118103},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.516939103603363},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5064798593521118},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4787306487560272},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4272370934486389},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3867374360561371},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3444865345954895},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3607828.3617796","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3607828.3617796","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607828.3617796","source":null,"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th International Workshop on Multimedia Assisted Dietary Management","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2309.00199","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.00199","pdf_url":"https://arxiv.org/pdf/2309.00199","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3607828.3617796","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3607828.3617796","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607828.3617796","source":null,"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th International Workshop on Multimedia Assisted Dietary Management","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Zero hunger","score":0.6200000047683716,"id":"https://metadata.un.org/sdg/2"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4386437562.pdf","grobid_xml":"https://content.openalex.org/works/W4386437562.grobid-xml"},"referenced_works_count":60,"referenced_works":["https://openalex.org/W12634471","https://openalex.org/W639708223","https://openalex.org/W1835579201","https://openalex.org/W2091013587","https://openalex.org/W2117539524","https://openalex.org/W2119168155","https://openalex.org/W2125269571","https://openalex.org/W2165232124","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2543791385","https://openalex.org/W2560828904","https://openalex.org/W2562357606","https://openalex.org/W2612690371","https://openalex.org/W2730200455","https://openalex.org/W2796855877","https://openalex.org/W2824941129","https://openalex.org/W2858926098","https://openalex.org/W2935951707","https://openalex.org/W2954996726","https://openalex.org/W2962691457","https://openalex.org/W2963037989","https://openalex.org/W2963351448","https://openalex.org/W2980407281","https://openalex.org/W2991915699","https://openalex.org/W2999905431","https://openalex.org/W3005797892","https://openalex.org/W3009381623","https://openalex.org/W3034451759","https://openalex.org/W3035574324","https://openalex.org/W3041350610","https://openalex.org/W3046372357","https://openalex.org/W3080950656","https://openalex.org/W3091123787","https://openalex.org/W3135185741","https://openalex.org/W3138317816","https://openalex.org/W3138540374","https://openalex.org/W3173138851","https://openalex.org/W3180196270","https://openalex.org/W3180355996","https://openalex.org/W3181518652","https://openalex.org/W3182381947","https://openalex.org/W3198052526","https://openalex.org/W3202232857","https://openalex.org/W3205553363","https://openalex.org/W3215720729","https://openalex.org/W3217076946","https://openalex.org/W4285295719","https://openalex.org/W4306964670","https://openalex.org/W4312497550","https://openalex.org/W4312749295","https://openalex.org/W4312933868","https://openalex.org/W4319996536","https://openalex.org/W4362684530","https://openalex.org/W4385801415","https://openalex.org/W4386057725","https://openalex.org/W4386065848","https://openalex.org/W4386076368","https://openalex.org/W6600407735","https://openalex.org/W6725504251"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4395044357","https://openalex.org/W4287117424","https://openalex.org/W4387506531","https://openalex.org/W2087346071","https://openalex.org/W2967848559","https://openalex.org/W4299831724"],"abstract_inverted_index":{"Image-based":[0],"dietary":[1],"assessment":[2],"serves":[3],"as":[4,20,33],"an":[5,162],"efficient":[6],"and":[7,12,37,68,160,172,185],"accurate":[8],"solution":[9,79],"for":[10,51,86,103,124,169],"recording":[11],"analyzing":[13],"nutrition":[14],"intake":[15],"using":[16,219],"eating":[17],"occasion":[18],"images":[19,48,73,85,110,133,153,203],"input.":[21],"Deep":[22],"learning-based":[23],"techniques":[24],"are":[25],"commonly":[26],"used":[27],"to":[28,60,81,138],"perform":[29],"image":[30,126,193],"analysis":[31],"such":[32,54],"food":[34,47,72,84,109,132,152,174,202,217],"classification,":[35],"segmentation,":[36],"portion":[38],"size":[39],"estimation,":[40],"which":[41],"rely":[42],"on":[43,155,181],"large":[44],"amounts":[45],"of":[46,71,96,107,131,150],"with":[49,191],"annotations":[50],"training.":[52],"However,":[53],"data":[55,87],"dependency":[56],"poses":[57],"significant":[58],"barriers":[59],"real-world":[61],"applications,":[62],"because":[63],"acquiring":[64],"a":[65],"substantial,":[66],"diverse,":[67],"balanced":[69],"set":[70],"can":[74,134,207],"be":[75,135],"challenging.":[76],"One":[77],"potential":[78],"is":[80,179],"use":[82,95],"synthetic":[83,108,151,201],"augmentation.":[88],"Although":[89],"existing":[90,192],"work":[91],"has":[92],"explored":[93],"the":[94,105,129,139,148,156,182,200,210,220],"generative":[97,118],"adversarial":[98],"networks":[99],"(GAN)":[100],"based":[101,154],"structures":[102],"generation,":[104],"quality":[106],"still":[111],"remains":[112],"subpar.":[113],"In":[114,143],"addition,":[115],"while":[116],"diffusion-based":[117],"models":[119],"have":[120],"shown":[121],"promising":[122],"results":[123],"general":[125],"generation":[127,130,149,194],"tasks,":[128],"challenging":[136],"due":[137],"substantial":[140],"intra-class":[141],"variance.":[142],"this":[144],"paper,":[145],"we":[146],"investigate":[147],"conditional":[157],"diffusion":[158],"model":[159],"propose":[161],"effective":[163],"clustering-based":[164],"training":[165],"framework,":[166],"named":[167],"ClusDiff,":[168],"generating":[170],"high-quality":[171],"representative":[173],"images.":[175],"The":[176],"proposed":[177],"method":[178],"evaluated":[180],"Food-101":[183],"dataset":[184],"shows":[186],"improved":[187],"performance":[188],"when":[189],"compared":[190],"works.":[195],"We":[196],"also":[197],"demonstrate":[198],"that":[199],"generated":[204],"by":[205],"ClusDiff":[206],"help":[208],"address":[209],"severe":[211],"class":[212],"imbalance":[213],"issue":[214],"in":[215],"long-tailed":[216],"classification":[218],"VFN-LT":[221],"dataset.":[222]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2023-09-06T00:00:00"}
