{"id":"https://openalex.org/W4403791153","doi":"https://doi.org/10.1145/3664647.3681185","title":"InstantAS: Minimum Coverage Sampling for Arbitrary-Size Image Generation","display_name":"InstantAS: Minimum Coverage Sampling for Arbitrary-Size Image Generation","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403791153","doi":"https://doi.org/10.1145/3664647.3681185"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3681185","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681185","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039327013","display_name":"Changshuo Wang","orcid":"https://orcid.org/0000-0002-9970-191X"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Changshuo Wang","raw_affiliation_strings":["Shandong University, Jinan, Shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, Shandong, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009433044","display_name":"Mingzhe Yu","orcid":"https://orcid.org/0009-0005-3793-0847"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingzhe Yu","raw_affiliation_strings":["Shandong University, Jinan, Shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, Shandong, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068636370","display_name":"Lei Wu","orcid":"https://orcid.org/0000-0002-3872-9062"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Wu","raw_affiliation_strings":["Shandong University, Jinan, Shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, Shandong, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100629169","display_name":"Lei Meng","orcid":"https://orcid.org/0000-0002-0273-5946"},"institutions":[{"id":"https://openalex.org/I119203015","display_name":"Shandong University of Technology","ror":"https://ror.org/02mr3ar13","country_code":"CN","type":"education","lineage":["https://openalex.org/I119203015"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Meng","raw_affiliation_strings":["Shandong University &amp; Shandong Research Institute of Industrial Technology, Jinan, Shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong University &amp; Shandong Research Institute of Industrial Technology, Jinan, Shandong, China","institution_ids":["https://openalex.org/I119203015"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103005164","display_name":"Xiang Li","orcid":"https://orcid.org/0000-0003-3828-9834"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiang Li","raw_affiliation_strings":["Shandong University, Jinan, Shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, Shandong, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101536417","display_name":"Xiangxu Meng","orcid":"https://orcid.org/0000-0001-7290-5659"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangxu Meng","raw_affiliation_strings":["Shandong University, Jinan, Shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, Shandong, China","institution_ids":["https://openalex.org/I154099455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5039327013"],"corresponding_institution_ids":["https://openalex.org/I154099455"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.18476931,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"3180","last_page":"3188"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.638124942779541},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.528801679611206},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5211727023124695},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3426673710346222}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.638124942779541},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.528801679611206},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5211727023124695},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3426673710346222},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3681185","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681185","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2183341477","https://openalex.org/W2962770929","https://openalex.org/W2962793481","https://openalex.org/W2963073614","https://openalex.org/W2963800363","https://openalex.org/W3034839660","https://openalex.org/W3035574324","https://openalex.org/W3036167779","https://openalex.org/W3096831136","https://openalex.org/W3180355996","https://openalex.org/W4246999471","https://openalex.org/W4300424419","https://openalex.org/W4306820534","https://openalex.org/W4312694728","https://openalex.org/W4312933868","https://openalex.org/W4321276804","https://openalex.org/W4386057725","https://openalex.org/W4386072096","https://openalex.org/W4386083141","https://openalex.org/W6779823529"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"diffusion":[3,20,46,127],"models":[4,21,47],"have":[5],"dominated":[6],"the":[7,52,69,84,88,100,103,109,116,119,124,133,138,146],"field":[8],"of":[9,90,102,118,126,132,148],"image":[10,74,121,167],"generation":[11,15,89,168],"with":[12],"their":[13,32],"outstanding":[14],"quality.":[16],"However,":[17],"pre-trained":[18],"large-scale":[19],"are":[22],"generally":[23],"trained":[24],"using":[25,151],"fixed-size":[26],"images,":[27],"and":[28,62,93,122,170],"fail":[29],"to":[30,114,164,178],"maintain":[31,99],"performance":[33],"at":[34],"different":[35,130,149,152],"aspect":[36],"ratios.":[37],"Existing":[38],"methods":[39,169],"for":[40,54,72,145],"generating":[41],"arbitrary-size":[42,73,166],"images":[43],"based":[44],"on":[45,83],"face":[48],"several":[49],"issues,":[50],"including":[51],"requirement":[53],"extensive":[55],"finetuning":[56],"or":[57],"training,":[58],"sluggish":[59],"sampling":[60,96,175],"speed,":[61],"noticeable":[63],"edge":[64],"artifacts.":[65],"This":[66,76],"paper":[67],"presents":[68],"InstantAS":[70,158],"method":[71,77,113],"generation.":[75],"performs":[78],"non-overlapping":[79],"minimum":[80],"coverage":[81],"segmentation":[82],"target":[85],"image,":[86,105],"minimizing":[87],"redundant":[91],"information":[92],"significantly":[94],"improving":[95],"speed.":[97],"To":[98],"consistency":[101],"generated":[104],"we":[106,136],"also":[107],"proposed":[108],"Inter-Domain":[110],"Distribution":[111],"Bridging":[112],"integrate":[115],"distribution":[117],"entire":[120],"suppress":[123],"separation":[125],"paths":[128],"in":[129,174],"regions":[131,150],"image.":[134],"Furthermore,":[135],"propose":[137],"dynamic":[139],"semantic":[140],"guided":[141],"cross-attention":[142],"method,":[143],"allowing":[144],"control":[147],"semantics.":[153],"Experimental":[154],"results":[155],"show":[156],"that":[157],"has":[159],"better":[160],"fusion":[161],"capabilities":[162],"compared":[163,177],"previous":[165],"is":[171],"far":[172],"ahead":[173],"speed":[176],"them.":[179]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
