{"id":"https://openalex.org/W3207441221","doi":"https://doi.org/10.1145/3474085.3475525","title":"Diverse Multimedia Layout Generation with Multi Choice Learning","display_name":"Diverse Multimedia Layout Generation with Multi Choice Learning","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3207441221","doi":"https://doi.org/10.1145/3474085.3475525","mag":"3207441221"},"language":"en","primary_location":{"id":"doi:10.1145/3474085.3475525","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475525","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2301.06629","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113883562","display_name":"David D. Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I31746571","display_name":"UNSW Sydney","ror":"https://ror.org/03r8z3t63","country_code":"AU","type":"education","lineage":["https://openalex.org/I31746571"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"David D. Nguyen","raw_affiliation_strings":["University of New South Wales, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of New South Wales, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I31746571"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082256444","display_name":"\u202aSurya Nepal\u202c","orcid":"https://orcid.org/0000-0002-3289-6599"},"institutions":[{"id":"https://openalex.org/I42894916","display_name":"Data61","ror":"https://ror.org/03q397159","country_code":"AU","type":"other","lineage":["https://openalex.org/I1292875679","https://openalex.org/I2801453606","https://openalex.org/I42894916","https://openalex.org/I4387156119"]},{"id":"https://openalex.org/I1292875679","display_name":"Commonwealth Scientific and Industrial Research Organisation","ror":"https://ror.org/03qn8fb07","country_code":"AU","type":"funder","lineage":["https://openalex.org/I1292875679","https://openalex.org/I2801453606","https://openalex.org/I4387156119"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Surya Nepal","raw_affiliation_strings":["CSIRO, Data61, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"CSIRO, Data61, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I42894916","https://openalex.org/I1292875679"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059077090","display_name":"Salil S. Kanhere","orcid":"https://orcid.org/0000-0002-1835-3475"},"institutions":[{"id":"https://openalex.org/I31746571","display_name":"UNSW Sydney","ror":"https://ror.org/03r8z3t63","country_code":"AU","type":"education","lineage":["https://openalex.org/I31746571"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Salil S. Kanhere","raw_affiliation_strings":["University of New South Wales Sydney, Sydney, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"University of New South Wales Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I31746571"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5113883562"],"corresponding_institution_ids":["https://openalex.org/I31746571"],"apc_list":null,"apc_paid":null,"fwci":0.9689,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.77928162,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"218","last_page":"226"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11666","display_name":"Color Science and Applications","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7902147769927979},{"id":"https://openalex.org/keywords/logos-bible-software","display_name":"Logos Bible Software","score":0.6642200350761414},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.5356191396713257},{"id":"https://openalex.org/keywords/logo","display_name":"Logo (programming language)","score":0.5324994325637817},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.5075126886367798},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4464977979660034},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4421542286872864},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.441410094499588},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3284528851509094},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.0941472053527832},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09327724575996399}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7902147769927979},{"id":"https://openalex.org/C150506046","wikidata":"https://www.wikidata.org/wiki/Q6667822","display_name":"Logos Bible Software","level":2,"score":0.6642200350761414},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.5356191396713257},{"id":"https://openalex.org/C2778720087","wikidata":"https://www.wikidata.org/wiki/Q201436","display_name":"Logo (programming language)","level":2,"score":0.5324994325637817},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.5075126886367798},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4464977979660034},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4421542286872864},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.441410094499588},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3284528851509094},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0941472053527832},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09327724575996399},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3474085.3475525","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475525","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2301.06629","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.06629","pdf_url":"https://arxiv.org/pdf/2301.06629","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2301.06629","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.06629","pdf_url":"https://arxiv.org/pdf/2301.06629","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8100000023841858,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3207441221.pdf","grobid_xml":"https://content.openalex.org/works/W3207441221.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W566667199","https://openalex.org/W1536598138","https://openalex.org/W1579853615","https://openalex.org/W1605527696","https://openalex.org/W1810943226","https://openalex.org/W1959608418","https://openalex.org/W1967011969","https://openalex.org/W1990284337","https://openalex.org/W2081605477","https://openalex.org/W2148985659","https://openalex.org/W2216735140","https://openalex.org/W2557519264","https://openalex.org/W2703190149","https://openalex.org/W2765874585","https://openalex.org/W2793483732","https://openalex.org/W2798788395","https://openalex.org/W2884948865","https://openalex.org/W2885024018","https://openalex.org/W2891790128","https://openalex.org/W2948479456","https://openalex.org/W2950802180","https://openalex.org/W2960053204","https://openalex.org/W2963184176","https://openalex.org/W2963522749","https://openalex.org/W2963601843","https://openalex.org/W2963842958","https://openalex.org/W2963981733","https://openalex.org/W2967177252","https://openalex.org/W2985299701","https://openalex.org/W3000176874","https://openalex.org/W3003711898","https://openalex.org/W3015225138","https://openalex.org/W3035050475","https://openalex.org/W3093772859","https://openalex.org/W3112646048","https://openalex.org/W3201409833","https://openalex.org/W4288627824","https://openalex.org/W4299510085","https://openalex.org/W4301504317","https://openalex.org/W4320013936"],"related_works":["https://openalex.org/W2946658881","https://openalex.org/W2112896459","https://openalex.org/W2026754580","https://openalex.org/W3198749917","https://openalex.org/W2085407156","https://openalex.org/W2098050557","https://openalex.org/W654432377","https://openalex.org/W1993445589","https://openalex.org/W4212899853","https://openalex.org/W2990113118"],"abstract_inverted_index":{"Designing":[0],"visually":[1],"appealing":[2],"layouts":[3,22,48,82,177,192],"for":[4,165],"multimedia":[5],"documents":[6],"containing":[7],"text,":[8],"graphs":[9],"and":[10,33,141,175,204,219],"images":[11],"requires":[12],"a":[13,44,56,84,106,120,160,179],"form":[14,115],"of":[15,21,46,162],"creative":[16],"intelligence.":[17],"Modelling":[18],"the":[19,63,70,102,110,123,151],"generation":[20],"has":[23],"recently":[24],"gained":[25],"attention":[26],"due":[27],"to":[28,38,144,158,172,226],"its":[29],"importance":[30],"in":[31,122,184,224],"aesthetics":[32],"communication":[34],"style.":[35],"In":[36,89,109,125],"contrast":[37,185],"standard":[39],"prediction":[40,87,140],"tasks,":[41],"there":[42],"are":[43,73],"range":[45,161],"acceptable":[47],"which":[49,182,189],"depend":[50],"on":[51,62,69,199],"user":[52],"preferences.":[53],"For":[54],"example,":[55,112],"poster":[57],"designer":[58],"may":[59],"prefer":[60],"logos":[61,68],"top-left":[64],"while":[65],"another":[66],"prefers":[67],"bottom-right.":[71],"Both":[72],"correct":[74],"choices":[75,100],"yet":[76],"existing":[77,187,227],"machine":[78],"learning":[79],"models":[80,93],"treat":[81],"as":[83],"single":[85,180],"choice":[86],"problem.":[88],"such":[90],"situations,":[91],"these":[92],"would":[94,114],"simply":[95],"average":[96],"over":[97],"all":[98],"possible":[99,163],"given":[101],"same":[103],"input":[104,181],"forming":[105],"degenerate":[107],"sample.":[108],"above":[111],"this":[113,126],"an":[116,130],"unacceptable":[117],"layout":[118,147,167],"with":[119,186,193],"logo":[121],"centre.":[124],"paper,":[127],"we":[128,208],"present":[129],"auto-regressive":[131],"neural":[132],"network":[133],"architecture,":[134],"called":[135],"LayoutMCL,":[136],"that":[137,210],"uses":[138],"multi-choice":[139],"winner-takes-all":[142],"loss":[143],"effectively":[145],"stabilise":[146],"generation.":[148],"LayoutMCL":[149,171,211],"avoids":[150],"averaging":[152],"problem":[153],"by":[154,217],"using":[155],"multiple":[156,174],"predictors":[157],"learn":[159],"options":[164],"each":[166],"object.":[168],"This":[169],"enables":[170],"generate":[173],"diverse":[176],"from":[178],"is":[183],"approaches":[188],"yield":[190],"similar":[191],"minor":[194],"variations.":[195],"Through":[196],"quantitative":[197],"benchmarks":[198],"real":[200],"data":[201],"(magazine,":[202],"document":[203],"mobile":[205],"app":[206],"layouts),":[207],"demonstrate":[209],"reduces":[212],"Fr\\'echet":[213],"Inception":[214],"Distance":[215],"(FID)":[216],"83-98%":[218],"generates":[220],"significantly":[221],"more":[222],"diversity":[223],"comparison":[225],"approaches.":[228]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
