{"id":"https://openalex.org/W4411472261","doi":"https://doi.org/10.1109/tmm.2025.3581776","title":"WI3D: Weakly Incremental 3D Detection via Vision Foundation Models","display_name":"WI3D: Weakly Incremental 3D Detection via Vision Foundation Models","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4411472261","doi":"https://doi.org/10.1109/tmm.2025.3581776"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3581776","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3581776","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101698381","display_name":"Mingsheng Li","orcid":"https://orcid.org/0009-0004-3758-0018"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mingsheng Li","raw_affiliation_strings":["School of Information Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114804332","display_name":"Sijin Chen","orcid":"https://orcid.org/0009-0008-1319-746X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sijin Chen","raw_affiliation_strings":["School of Information Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014725693","display_name":"Shengji Tang","orcid":"https://orcid.org/0009-0001-3456-8310"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengji Tang","raw_affiliation_strings":["School of Information Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015639955","display_name":"Hongyuan Zhu","orcid":"https://orcid.org/0000-0001-5177-8320"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]},{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Hongyuan Zhu","raw_affiliation_strings":["Institute for Infocomm Research (I R) &amp; Centre for Frontier AI Research (CFAR), A*STAR, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research (I R) &amp; Centre for Frontier AI Research (CFAR), A*STAR, Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002275591","display_name":"Yanyan Fang","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanyan Fang","raw_affiliation_strings":["School of Information Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100363100","display_name":"Xin Chen","orcid":"https://orcid.org/0000-0002-9347-1367"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Chen","raw_affiliation_strings":["Tencent GY-Laboratory, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tencent GY-Laboratory, Shanghai, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101625859","display_name":"Zhuoyuan Li","orcid":"https://orcid.org/0000-0002-0600-7487"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuoyuan Li","raw_affiliation_strings":["School of Information Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076278944","display_name":"Fukun Yin","orcid":"https://orcid.org/0000-0003-2623-1619"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fukun Yin","raw_affiliation_strings":["School of Information Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021220108","display_name":"Tao Chen","orcid":"https://orcid.org/0000-0002-0779-9818"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Chen","raw_affiliation_strings":["School of Information Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5101698381"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.2330433,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9753999710083008,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.967199981212616,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8157126903533936},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.658252477645874},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43311864137649536},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3564460277557373}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8157126903533936},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.658252477645874},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43311864137649536},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3564460277557373},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3581776","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3581776","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Class-incremental":[0],"3D":[1,6,33,71,114],"object":[2],"detection":[3,26],"demands":[4],"a":[5,19,49,70,83,103,122,146,161],"detector":[7,72],"to":[8,73,151],"<italic":[9,13],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[10,14,54,57,60,63,66],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">locate</i>":[11],"and":[12,90,96,133,169,196,203],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">recognize</i>":[15],"novel":[16,37,84,157,185],"categories":[17],"in":[18,40,140,193],"stream":[20],"fashion":[21],"while":[22,187],"preserving":[23,188],"its":[24],"base":[25,191],"ability.":[27],"However,":[28],"existing":[29],"methods":[30],"require":[31],"delicate":[32],"annotations":[34],"for":[35,109],"learning":[36,155],"categories,":[38],"resulting":[39],"significant":[41],"labeling":[42],"costs.":[43],"To":[44],"this":[45],"end,":[46],"we":[47,144],"explore":[48],"label-efficient":[50],"approach":[51,181],"called":[52],"<bold":[53,56,59,62],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">W</b>eakly":[55],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">I</b>ncremental":[58],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">3</b>D":[61],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">D</b>etection":[64],"(<bold":[65],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">WI3D</b>),":[67],"which":[68],"teaches":[69],"learn":[74,184],"incrementally":[75],"with":[76,136,160],"off-the-shelf":[77],"vision":[78],"foundation":[79],"models.":[80],"We":[81],"propose":[82],"dual-teaching":[85],"framework":[86,101],"incorporating":[87],"both":[88,201],"intra-modal":[89],"inter-modal":[91],"knowledge":[92,148,163,171,189],"from":[93,172],"pseudo":[94,115,131],"labels":[95,132],"feature":[97],"space.":[98],"Specifically,":[99],"our":[100,180],"features":[102],"class-agnostic":[104],"pseudo-label":[105],"refinement":[106],"module,":[107],"designed":[108],"the":[110,127,153],"generation":[111],"of":[112,156,190],"high-quality":[113],"labels.":[116],"This":[117],"module":[118,150],"is":[119],"built":[120],"on":[121,200],"lightweight":[123],"transformer":[124],"that":[125,166,179],"models":[126],"spatial":[128],"relationships":[129],"between":[130],"their":[134],"interactions":[135],"rich":[137],"contextual":[138],"information":[139],"point":[141],"clouds.":[142],"Additionally,":[143],"introduce":[145],"cross-modal":[147],"transfer":[149],"enhance":[152],"representation":[154],"classes,":[158],"along":[159],"reweighting":[162],"distillation":[164],"strategy":[165],"dynamically":[167],"assesses":[168],"distills":[170],"previously":[173],"learned":[174],"categories.":[175],"Extensive":[176],"experiments":[177],"show":[178],"can":[182],"efficiently":[183],"concepts":[186],"classes":[192],"WI3D":[194],"scenarios,":[195],"surpass":[197],"baseline":[198],"approaches":[199],"SUN-RGBD":[202],"ScanNet.":[204]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
