{"id":"https://openalex.org/W4414539379","doi":"https://doi.org/10.23919/mva65244.2025.11175082","title":"FMDP: Leveraging a Foundation Model for Dual-Pixel Disparity Estimation","display_name":"FMDP: Leveraging a Foundation Model for Dual-Pixel Disparity Estimation","publication_year":2025,"publication_date":"2025-07-26","ids":{"openalex":"https://openalex.org/W4414539379","doi":"https://doi.org/10.23919/mva65244.2025.11175082"},"language":"en","primary_location":{"id":"doi:10.23919/mva65244.2025.11175082","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva65244.2025.11175082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 19th International Conference on Machine Vision and Applications (MVA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109791569","display_name":"Doehyung Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Doehyung Lee","raw_affiliation_strings":["Institute of Science,Tokyo,Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Science,Tokyo,Japan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101866229","display_name":"Zhuofeng Wu","orcid":"https://orcid.org/0009-0009-9150-2869"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhuofeng Wu","raw_affiliation_strings":["Institute of Science,Tokyo,Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Science,Tokyo,Japan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039862436","display_name":"Yusuke Monno","orcid":"https://orcid.org/0000-0001-6733-3406"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yusuke Monno","raw_affiliation_strings":["Institute of Science,Tokyo,Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Science,Tokyo,Japan","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024453747","display_name":"Masatoshi Okutomi","orcid":"https://orcid.org/0000-0001-5787-0742"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Masatoshi Okutomi","raw_affiliation_strings":["Institute of Science,Tokyo,Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Science,Tokyo,Japan","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.35807329,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10522","display_name":"Medical Imaging Techniques and Applications","score":0.7554000020027161,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10522","display_name":"Medical Imaging Techniques and Applications","score":0.7554000020027161,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7145000100135803},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6967999935150146},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.6503000259399414},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5781999826431274},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.5414999723434448},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.4997999966144562}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7145000100135803},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6967999935150146},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6901000142097473},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6693999767303467},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.6503000259399414},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5781999826431274},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.5414999723434448},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5109999775886536},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.4997999966144562},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4169999957084656},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.3248000144958496},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.323199987411499},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2838999927043915},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2775999903678894},{"id":"https://openalex.org/C167928553","wikidata":"https://www.wikidata.org/wiki/Q1376021","display_name":"Estimation theory","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/mva65244.2025.11175082","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva65244.2025.11175082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 19th International Conference on Machine Vision and Applications (MVA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2008990620","https://openalex.org/W2895076274","https://openalex.org/W2954740582","https://openalex.org/W2981612893","https://openalex.org/W3010383031","https://openalex.org/W3032997361","https://openalex.org/W3110381689","https://openalex.org/W3177732058","https://openalex.org/W4214520160","https://openalex.org/W4226265017","https://openalex.org/W4386075776","https://openalex.org/W4399563610","https://openalex.org/W4401537523","https://openalex.org/W4402727359","https://openalex.org/W4402753888"],"related_works":[],"abstract_inverted_index":{"In":[0,53],"this":[1],"paper,":[2],"we":[3],"propose":[4],"a":[5,29,49,69,83,87],"foundation-model-aided":[6],"dual-pixel":[7,19,34,88],"disparity":[8,35,89],"estimation":[9,36,90],"network,":[10],"named":[11],"FMDP,":[12],"which":[13],"leverages":[14],"the":[15,23,46,62,80],"physical":[16],"cues":[17],"from":[18,40,82],"de-focus":[20],"disparities":[21],"and":[22,105,114],"powerful":[24],"scene":[25],"priors":[26],"encoded":[27],"by":[28],"depth-estimation":[30,56],"foundation":[31,57,84],"model.":[32],"Previous":[33],"methods":[37,101],"often":[38],"suffer":[39],"limited":[41],"generalization":[42,116],"ability":[43],"due":[44],"to":[45,112,117],"lack":[47],"of":[48,64,72],"large-scale":[50],"training":[51],"dataset.":[52],"contrast,":[54],"recent":[55],"models":[58],"can":[59],"successfully":[60],"encode":[61],"features":[63,81],"diverse":[65],"real":[66,106,119],"scenes":[67],"using":[68],"huge":[70],"amount":[71],"data.":[73],"Given":[74],"this,":[75],"our":[76,96],"FMDP":[77,97],"effectively":[78],"integrates":[79],"model":[85],"into":[86],"pipeline.":[91],"Experimental":[92],"results":[93],"show":[94],"that":[95],"consistently":[98],"outperforms":[99],"prior":[100],"on":[102],"both":[103],"synthetic":[104],"scenes,":[107],"especially":[108],"demonstrating":[109],"improved":[110],"robustness":[111],"noise":[113],"strong":[115],"unseen":[118],"scenes.":[120]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
