{"id":"https://openalex.org/W4387969239","doi":"https://doi.org/10.1145/3581783.3612678","title":"3D Creation at Your Fingertips: From Text or Image to 3D Assets","display_name":"3D Creation at Your Fingertips: From Text or Image to 3D Assets","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4387969239","doi":"https://doi.org/10.1145/3581783.3612678"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3612678","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612678","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083113249","display_name":"Yang Chen","orcid":"https://orcid.org/0009-0001-9058-5051"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Chen","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0009-0001-9058-5051","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027796698","display_name":"Jingwen Chen","orcid":"https://orcid.org/0000-0002-7917-6003"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingwen Chen","raw_affiliation_strings":["Sun Yat-sen University, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-7917-6003","affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085403640","display_name":"Yingwei Pan","orcid":"https://orcid.org/0000-0002-4344-8898"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingwei Pan","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-4344-8898","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071510961","display_name":"Xinmei Tian","orcid":"https://orcid.org/0000-0002-5952-8753"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinmei Tian","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-5952-8753","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101517779","display_name":"Tao Mei","orcid":"https://orcid.org/0000-0002-5990-7307"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao Mei","raw_affiliation_strings":["HiDream.ai Inc., Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5990-7307","affiliations":[{"raw_affiliation_string":"HiDream.ai Inc., Beijing, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5083113249"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":1.4494,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.79072013,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"9408","last_page":"9410"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8414335250854492},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.6147332787513733},{"id":"https://openalex.org/keywords/3d-modeling","display_name":"3D modeling","score":0.5424053072929382},{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.5276459455490112},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4855877757072449},{"id":"https://openalex.org/keywords/3d-model","display_name":"3d model","score":0.48063865303993225},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4557156562805176},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44294002652168274},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3813055157661438},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.15624138712882996},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1090516448020935}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8414335250854492},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.6147332787513733},{"id":"https://openalex.org/C2777897806","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3D modeling","level":2,"score":0.5424053072929382},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.5276459455490112},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4855877757072449},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.48063865303993225},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4557156562805176},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44294002652168274},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3813055157661438},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.15624138712882996},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1090516448020935}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581783.3612678","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612678","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8399999737739563}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2981876524","https://openalex.org/W2982192816","https://openalex.org/W3183430956","https://openalex.org/W3213433499","https://openalex.org/W4366352791"],"related_works":["https://openalex.org/W2708417971","https://openalex.org/W2314700393","https://openalex.org/W4384469254","https://openalex.org/W2563904947","https://openalex.org/W3116009112","https://openalex.org/W3036892807","https://openalex.org/W2995646374","https://openalex.org/W2983578059","https://openalex.org/W1970233280","https://openalex.org/W4244364093"],"abstract_inverted_index":{"We":[0,66],"demonstrate":[1],"an":[2],"automatic":[3],"3D":[4,11,24,58,89,105,138,166],"creation":[5,167],"system,":[6],"which":[7,124],"can":[8,28,118],"create":[9,119],"realistic":[10],"assets":[12,139],"solely":[13],"from":[14,111],"a":[15,40,56,68,79,85,102,157],"text":[16,146],"or":[17,38,147],"image":[18,42,148],"prompt":[19],"without":[20],"requiring":[21],"any":[22],"specialized":[23],"modeling":[25],"skills.":[26],"Users":[27],"either":[29],"describe":[30],"the":[31,50,63,97,132,136,144],"object":[32],"they":[33,46],"envision":[34],"in":[35,122],"natural":[36],"language":[37],"upload":[39],"reference":[41],"that":[43,60,135],"records":[44],"what":[45],"have":[47],"seen":[48],"with":[49,107,143],"phone.":[51],"Our":[52,116],"system":[53,117,133],"will":[54],"generate":[55],"high-quality":[57],"mesh":[59,81,95,106],"faithfully":[61],"matches":[62],"users'":[64],"input.":[65],"propose":[67],"coarse-to-fine":[69],"framework":[70],"to":[71,164],"achieve":[72],"this":[73],"goal.":[74],"Specifically,":[75],"we":[76,99],"first":[77],"obtain":[78],"low-resolution":[80],"instantly":[82],"by":[83],"utilizing":[84],"pre-trained":[86],"text/image":[87],"conditional":[88],"generative":[90],"model.":[91],"Using":[92],"such":[93],"coarse":[94],"as":[96],"initialization,":[98],"further":[100],"optimize":[101],"high-resolution":[103],"textured":[104],"fine-grained":[108],"appearance":[109],"guidance":[110],"large-scale":[112],"2D":[113],"diffusion":[114],"models.":[115],"visually-pleasing":[120],"results":[121],"minutes,":[123],"is":[125],"significantly":[126],"faster":[127],"than":[128],"existing":[129],"methods.":[130],"Meanwhile,":[131],"ensures":[134],"resulting":[137],"are":[140],"precisely":[141],"aligned":[142],"input":[145],"prompt.":[149],"With":[150],"these":[151],"advanced":[152],"capabilities,":[153],"our":[154],"demonstration":[155],"provides":[156],"streamlined":[158],"and":[159],"intuitive":[160],"platform":[161],"for":[162],"users":[163],"incorporate":[165],"into":[168],"their":[169],"daily":[170],"lives.":[171]},"counts_by_year":[{"year":2024,"cited_by_count":7}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
