{"id":"https://openalex.org/W7131117483","doi":"https://doi.org/10.1109/iccvw69036.2025.00295","title":"Tree Mapping with Limited Data: Fine-Tuning Foundation Models for Multimodal Fusion","display_name":"Tree Mapping with Limited Data: Fine-Tuning Foundation Models for Multimodal Fusion","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W7131117483","doi":"https://doi.org/10.1109/iccvw69036.2025.00295"},"language":null,"primary_location":{"id":"doi:10.1109/iccvw69036.2025.00295","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00295","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126650217","display_name":"Xiaoyan Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Xiaoyan Lu","raw_affiliation_strings":["Hong Kong Polytechnic University,Hung Hom,HongKong"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Hung Hom,HongKong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126616162","display_name":"Qihao Weng","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Qihao Weng","raw_affiliation_strings":["Hong Kong Polytechnic University,Hung Hom,HongKong"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Hung Hom,HongKong","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5126650217"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.88570488,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2829","last_page":"2834"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.08540000021457672,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.08540000021457672,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.05480000004172325,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.047600001096725464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5942000150680542},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.531499981880188},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.453900009393692},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.4530999958515167},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.420199990272522},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.36739999055862427},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.35370001196861267},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.33149999380111694}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7384999990463257},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5963000059127808},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5942000150680542},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.531499981880188},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45750001072883606},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.453900009393692},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4530999958515167},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.420199990272522},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.3971000015735626},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.36739999055862427},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3668999969959259},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3544999957084656},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.35370001196861267},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.33149999380111694},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.31150001287460327},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.30379998683929443},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2791000008583069},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.2775999903678894},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.2727000117301941},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2615000009536743},{"id":"https://openalex.org/C183365957","wikidata":"https://www.wikidata.org/wiki/Q17140402","display_name":"Remote sensing application","level":3,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccvw69036.2025.00295","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00295","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2735039185","https://openalex.org/W4313156423","https://openalex.org/W4322766882","https://openalex.org/W4390874379","https://openalex.org/W4390874514","https://openalex.org/W4390874575","https://openalex.org/W4401608269","https://openalex.org/W4404294084","https://openalex.org/W4408634392","https://openalex.org/W4415798746"],"related_works":[],"abstract_inverted_index":{"Tree":[0],"mapping":[1,18],"plays":[2],"a":[3,40,129],"crucial":[4],"role":[5],"in":[6,29,125],"remote":[7,31,72],"sensing":[8,32,73],"for":[9,132],"ecological":[10],"monitoring":[11],"and":[12,36,58,82,104,134],"resource":[13],"management.":[14],"Achieving":[15],"accurate":[16],"tree":[17,52],"relies":[19],"on":[20],"labeled":[21],"training":[22,109],"data,":[23,84],"however,":[24],"annotating":[25],"geometrically":[26],"complex":[27],"trees":[28],"large-scale":[30],"imagery":[33],"is":[34],"time-consuming":[35],"labor-intensive.":[37],"We":[38],"propose":[39],"multimodal":[41,120],"fusion":[42],"framework":[43],"that":[44,96],"leverages":[45],"fine-tuned":[46],"foundation":[47],"models":[48],"to":[49,122],"enable":[50],"data-efficient":[51],"mapping.":[53],"To":[54],"enhance":[55],"spatial":[56],"understanding":[57],"structural":[59],"perception,":[60],"we":[61],"introduce":[62],"depth":[63,81,98],"information":[64,99],"as":[65],"an":[66],"auxiliary":[67],"modality":[68],"alongside":[69],"high-resolution":[70],"RGB":[71],"imagery.":[74],"By":[75],"leveraging":[76],"the":[77,88,116],"complementary":[78],"strengths":[79],"of":[80,90,118],"visual":[83],"our":[85],"method":[86],"mitigates":[87],"limitations":[89],"unimodal":[91],"inputs.":[92],"Experimental":[93],"results":[94],"demonstrate":[95],"integrating":[97],"significantly":[100],"improves":[101],"recognition":[102],"accuracy":[103],"boundary":[105],"delineation,":[106],"particularly":[107],"when":[108],"samples":[110],"are":[111],"scarce.":[112],"This":[113],"work":[114],"highlights":[115],"potential":[117],"depth-aware":[119],"learning":[121],"boost":[123],"performance":[124],"data-constrained":[126],"scenarios,":[127],"offering":[128],"promising":[130],"direction":[131],"scalable":[133],"cost-efficient":[135],"environmental":[136],"monitoring.":[137]},"counts_by_year":[],"updated_date":"2026-02-25T06:17:34.324206","created_date":"2026-02-24T00:00:00"}
