{"id":"https://openalex.org/W4414669998","doi":"https://doi.org/10.1007/s44267-025-00089-8","title":"Hybrid Fourier score distillation for efficient one image to 3D object generation","display_name":"Hybrid Fourier score distillation for efficient one image to 3D object generation","publication_year":2025,"publication_date":"2025-09-30","ids":{"openalex":"https://openalex.org/W4414669998","doi":"https://doi.org/10.1007/s44267-025-00089-8"},"language":"en","primary_location":{"id":"doi:10.1007/s44267-025-00089-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44267-025-00089-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s44267-025-00089-8.pdf","source":{"id":"https://openalex.org/S4387289164","display_name":"Visual Intelligence","issn_l":"2731-9008","issn":["2731-9008"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Visual Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://link.springer.com/content/pdf/10.1007/s44267-025-00089-8.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075107373","display_name":"Shuzhou Yang","orcid":"https://orcid.org/0009-0001-3632-9065"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuzhou Yang","raw_affiliation_strings":["Peng Cheng Laboratory, Shenzhen, China","School of Electronic and Computer Engineering, Peking University, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]},{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100445319","display_name":"Yu Wang","orcid":"https://orcid.org/0000-0003-0361-1563"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Wang","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005801079","display_name":"Haijie Li","orcid":"https://orcid.org/0000-0003-4908-4615"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haijie Li","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100594358","display_name":"Jiarui Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiarui Meng","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101688674","display_name":"Yanmin Wu","orcid":"https://orcid.org/0000-0002-3926-4500"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanmin Wu","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113838311","display_name":"Xiandong Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiandong Meng","raw_affiliation_strings":["Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100409856","display_name":"Jian Zhang","orcid":"https://orcid.org/0000-0001-5486-3125"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I88101031","display_name":"Immersion (United States)","ror":"https://ror.org/02qgx4h83","country_code":"US","type":"company","lineage":["https://openalex.org/I88101031"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Jian Zhang","raw_affiliation_strings":["Guangdong Provincial Key Laboratory of Ultra High Definition Immersive Media Technology, Shenzhen, China","Peng Cheng Laboratory, Shenzhen, China","School of Electronic and Computer Engineering, Peking University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-5486-3125","affiliations":[{"raw_affiliation_string":"Guangdong Provincial Key Laboratory of Ultra High Definition Immersive Media Technology, Shenzhen, China","institution_ids":["https://openalex.org/I88101031"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]},{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5075107373"],"corresponding_institution_ids":["https://openalex.org/I20231570","https://openalex.org/I4210136793"],"apc_list":null,"apc_paid":null,"fwci":2.8896,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.9258628,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"3","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.8758999705314636},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4569000005722046},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.45410001277923584},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.4153999984264374},{"id":"https://openalex.org/keywords/aliasing","display_name":"Aliasing","score":0.3783000111579895},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.37779998779296875},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3684000074863434},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.3553999960422516}],"concepts":[{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.8758999705314636},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6380000114440918},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6313999891281128},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.571399986743927},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4569000005722046},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.45410001277923584},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.4153999984264374},{"id":"https://openalex.org/C4069607","wikidata":"https://www.wikidata.org/wiki/Q868732","display_name":"Aliasing","level":3,"score":0.3783000111579895},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3684000074863434},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.3553999960422516},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3244999945163727},{"id":"https://openalex.org/C104065381","wikidata":"https://www.wikidata.org/wiki/Q1002535","display_name":"Geometric modeling","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.31360000371932983},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.30720001459121704},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3043000102043152},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.30410000681877136},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.28360000252723694},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.28220000863075256},{"id":"https://openalex.org/C181145010","wikidata":"https://www.wikidata.org/wiki/Q4418033","display_name":"Mesh generation","level":3,"score":0.2694999873638153},{"id":"https://openalex.org/C203024314","wikidata":"https://www.wikidata.org/wiki/Q1365258","display_name":"Fourier analysis","level":3,"score":0.2540999948978424}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s44267-025-00089-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44267-025-00089-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s44267-025-00089-8.pdf","source":{"id":"https://openalex.org/S4387289164","display_name":"Visual Intelligence","issn_l":"2731-9008","issn":["2731-9008"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Visual Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:95b1ede5128c4939a3400f086c739f10","is_oa":true,"landing_page_url":"https://doaj.org/article/95b1ede5128c4939a3400f086c739f10","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Visual Intelligence, Vol 3, Iss 1, Pp 1-13 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s44267-025-00089-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44267-025-00089-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s44267-025-00089-8.pdf","source":{"id":"https://openalex.org/S4387289164","display_name":"Visual Intelligence","issn_l":"2731-9008","issn":["2731-9008"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Visual Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G822965519","display_name":null,"funder_award_id":"62372016","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4414669998.pdf"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W2133665775","https://openalex.org/W2602856279","https://openalex.org/W2604292070","https://openalex.org/W2912083425","https://openalex.org/W2912500072","https://openalex.org/W2914304175","https://openalex.org/W3028314732","https://openalex.org/W3101027576","https://openalex.org/W4200150166","https://openalex.org/W4221151978","https://openalex.org/W4236573885","https://openalex.org/W4236965008","https://openalex.org/W4303574492","https://openalex.org/W4327519267","https://openalex.org/W4385318467","https://openalex.org/W4399574574"],"related_works":[],"abstract_inverted_index":{"Abstract":[0],"Single":[1],"image-to-3D":[2,188],"generation":[3,20,28,50,75,89,174,189],"is":[4,70],"pivotal":[5],"for":[6,161],"crafting":[7],"controllable":[8],"3D":[9,34,136,139,173,194],"assets.":[10],"Although":[11],"recent":[12],"inference-only":[13],"methods":[14,175],"have":[15,185],"achieved":[16],"impressive":[17],"effects,":[18],"their":[19,118],"quality":[21],"still":[22],"lags":[23],"behind":[24],"that":[25,68,204],"of":[26,57,63,77],"image":[27,49,88],"models.":[29],"We":[30,66],"attempt":[31],"to":[32,52,83,92,113,117,145,191],"leverage":[33],"geometric":[35,55,147],"priors":[36,46,62,76,140,152],"from":[37,47],"the":[38,54,58,64,74,142,154,158],"novel":[39,98],"view":[40,99],"diffusion":[41,80],"model":[42,51],"and":[43,60,176,215],"2D":[44,151],"appearance":[45,61,85,119],"an":[48,187],"combine":[53],"messages":[56],"former":[59],"latter.":[65],"note":[67],"there":[69],"a":[71,124,216],"disparity":[72],"between":[73],"these":[78],"two":[79],"models,":[81],"leading":[82],"different":[84,107],"outputs.":[86],"Specifically,":[87],"models":[90,100],"tend":[91],"deliver":[93],"more":[94],"detailed":[95],"visuals,":[96],"whereas":[97],"produce":[101,177],"consistent":[102],"yet":[103],"over-smooth":[104],"results":[105,210],"across":[106],"views.":[108],"Directly":[109],"combining":[110],"them":[111],"leads":[112],"suboptimal":[114],"effects":[115],"due":[116],"conflicts.":[120],"Hence,":[121],"we":[122,184],"propose":[123],"2D-3D":[125],"hybrid":[126],"Fourier":[127,159],"score":[128],"distillation":[129],"objective":[130],"function,":[131],"called":[132],"hy-FSD.":[133],"It":[134],"optimizes":[135],"Gaussians":[137],"using":[138],"in":[141,153],"spatial":[143],"domain":[144,156],"ensure":[146],"consistency,":[148],"while":[149],"exploiting":[150],"frequency":[155],"through":[157],"transform":[160],"better":[162],"visual":[163],"quality.":[164],"The":[165],"proposed":[166],"hy-FSD":[167],"can":[168],"be":[169],"integrated":[170],"into":[171],"existing":[172],"significant":[178],"performance":[179],"gains.":[180],"With":[181],"this":[182],"technique,":[183],"developed":[186],"pipeline":[190],"create":[192],"high-quality":[193],"objects":[195],"within":[196],"one":[197],"minute,":[198],"named":[199],"Fourier123.":[200],"Extensive":[201],"experiments":[202],"demonstrate":[203],"Fourier123":[205],"excels":[206],"at":[207],"efficiently":[208],"generating":[209],"with":[211],"rapid":[212],"convergence":[213],"speed":[214],"visually":[217],"appealing":[218],"output.":[219]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
