{"id":"https://openalex.org/W4386615379","doi":"https://doi.org/10.1109/icip49359.2023.10222155","title":"ICCL: Self-Supervised Intra- and Cross-Modal Contrastive Learning with 2D-3D Pairs for 3D Scene Understanding","display_name":"ICCL: Self-Supervised Intra- and Cross-Modal Contrastive Learning with 2D-3D Pairs for 3D Scene Understanding","publication_year":2023,"publication_date":"2023-09-11","ids":{"openalex":"https://openalex.org/W4386615379","doi":"https://doi.org/10.1109/icip49359.2023.10222155"},"language":"en","primary_location":{"id":"doi:10.1109/icip49359.2023.10222155","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icip49359.2023.10222155","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058678583","display_name":"Kyota Higa","orcid":"https://orcid.org/0009-0008-0526-9662"},"institutions":[{"id":"https://openalex.org/I118347220","display_name":"NEC (Japan)","ror":"https://ror.org/04jndar25","country_code":"JP","type":"company","lineage":["https://openalex.org/I118347220"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Kyota Higa","raw_affiliation_strings":["NEC Corporation,Visual Intelligence Research Laboratories,Kawasaki, Kanagawa,Japan","Visual Intelligence Research Laboratories, NEC Corporation, Kawasaki, Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"NEC Corporation,Visual Intelligence Research Laboratories,Kawasaki, Kanagawa,Japan","institution_ids":["https://openalex.org/I118347220"]},{"raw_affiliation_string":"Visual Intelligence Research Laboratories, NEC Corporation, Kawasaki, Kanagawa, Japan","institution_ids":["https://openalex.org/I118347220"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009394089","display_name":"Masahiro Yamaguchi","orcid":"https://orcid.org/0000-0003-1001-4505"},"institutions":[{"id":"https://openalex.org/I118347220","display_name":"NEC (Japan)","ror":"https://ror.org/04jndar25","country_code":"JP","type":"company","lineage":["https://openalex.org/I118347220"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masahiro Yamaguchi","raw_affiliation_strings":["NEC Corporation,Visual Intelligence Research Laboratories,Kawasaki, Kanagawa,Japan","Visual Intelligence Research Laboratories, NEC Corporation, Kawasaki, Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"NEC Corporation,Visual Intelligence Research Laboratories,Kawasaki, Kanagawa,Japan","institution_ids":["https://openalex.org/I118347220"]},{"raw_affiliation_string":"Visual Intelligence Research Laboratories, NEC Corporation, Kawasaki, Kanagawa, Japan","institution_ids":["https://openalex.org/I118347220"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110507817","display_name":"Toshinori Hosoi","orcid":null},"institutions":[{"id":"https://openalex.org/I118347220","display_name":"NEC (Japan)","ror":"https://ror.org/04jndar25","country_code":"JP","type":"company","lineage":["https://openalex.org/I118347220"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Toshinori Hosoi","raw_affiliation_strings":["NEC Corporation,Visual Intelligence Research Laboratories,Kawasaki, Kanagawa,Japan","Visual Intelligence Research Laboratories, NEC Corporation, Kawasaki, Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"NEC Corporation,Visual Intelligence Research Laboratories,Kawasaki, Kanagawa,Japan","institution_ids":["https://openalex.org/I118347220"]},{"raw_affiliation_string":"Visual Intelligence Research Laboratories, NEC Corporation, Kawasaki, Kanagawa, Japan","institution_ids":["https://openalex.org/I118347220"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5058678583"],"corresponding_institution_ids":["https://openalex.org/I118347220"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11153361,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"119","issue":null,"first_page":"1085","last_page":"1089"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.797765851020813},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7130082845687866},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6544216871261597},{"id":"https://openalex.org/keywords/transferability","display_name":"Transferability","score":0.5841736793518066},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5648859739303589},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.5638390779495239},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5520871877670288},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.528785765171051},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5232112407684326},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5207490921020508},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5190261602401733},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4198874235153198},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.41869598627090454},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3570104241371155},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.109352707862854}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.797765851020813},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7130082845687866},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6544216871261597},{"id":"https://openalex.org/C61272859","wikidata":"https://www.wikidata.org/wiki/Q7834031","display_name":"Transferability","level":3,"score":0.5841736793518066},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5648859739303589},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.5638390779495239},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5520871877670288},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.528785765171051},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5232112407684326},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5207490921020508},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5190261602401733},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4198874235153198},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.41869598627090454},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3570104241371155},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.109352707862854},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C140331021","wikidata":"https://www.wikidata.org/wiki/Q1868104","display_name":"Logit","level":2,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip49359.2023.10222155","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icip49359.2023.10222155","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1920022804","https://openalex.org/W2187089797","https://openalex.org/W2194775991","https://openalex.org/W2553307952","https://openalex.org/W2619697695","https://openalex.org/W2962960500","https://openalex.org/W2979750740","https://openalex.org/W2981440248","https://openalex.org/W2991485494","https://openalex.org/W3109931228","https://openalex.org/W3128716822","https://openalex.org/W3178738710","https://openalex.org/W3182683290","https://openalex.org/W3197097949","https://openalex.org/W3202611145","https://openalex.org/W3206846540","https://openalex.org/W6631190155","https://openalex.org/W6687484953","https://openalex.org/W6726497184","https://openalex.org/W6739778489","https://openalex.org/W6763103765","https://openalex.org/W6763236253","https://openalex.org/W6763422710","https://openalex.org/W6774314701","https://openalex.org/W6783272290","https://openalex.org/W6809733949"],"related_works":["https://openalex.org/W4399895933","https://openalex.org/W2161221533","https://openalex.org/W4229699405","https://openalex.org/W1666484574","https://openalex.org/W2216382288","https://openalex.org/W2355491300","https://openalex.org/W4234629551","https://openalex.org/W2011110943","https://openalex.org/W2440023763","https://openalex.org/W2962474440"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"self-supervised":[3,26],"intra-":[4],"and":[5,44,54,89,108,111,126,149],"cross-modal":[6],"contrastive":[7,38,56,63],"learning":[8,72,154],"(ICCL)":[9],"with":[10,33,48],"2D-3D":[11,45,55],"pairs":[12],"for":[13,146],"3D":[14,53,96,150],"scene":[15],"understanding.":[16],"Learning":[17],"from":[18],"different":[19],"modalities":[20],"has":[21],"produced":[22],"substantial":[23],"results":[24,93,120],"in":[25,65,165],"learning.":[27],"Our":[28],"method":[29,59],"learns":[30],"a":[31,49,61,73],"model":[32],"high":[34],"transferability":[35,80],"by":[36,81],"minimizing":[37,52],"losses":[39],"based":[40],"on":[41],"2D,":[42],"3D,":[43],"features.":[46],"Compared":[47],"conventional":[50,117,140],"approach":[51,102],"losses,":[57],"our":[58,101,132],"minimizes":[60],"2D":[62,147],"loss":[64],"addition":[66],"to":[67,71,136],"them.":[68],"It":[69],"leads":[70],"better":[74,143],"feature":[75,144],"representation.":[76],"We":[77],"evaluate":[78],"the":[79,95,116,122,127,160],"conducting":[82],"three":[83],"downstream":[84],"tasks,":[85],"including":[86],"object":[87,97,124],"classification":[88,98,125],"part":[90,128],"segmentation.":[91],"The":[92,119],"of":[94,106,121,162],"show":[99,130],"that":[100,131],"achieves":[103],"an":[104],"accuracy":[105,133],"91.7":[107],"85.4":[109],"(0.5":[110],"3.7":[112],"points":[113],"higher":[114,138],"than":[115,139],"method).":[118],"few-shot":[123],"segmentation":[129],"is":[134],"equal":[135],"or":[137],"methods.":[141],"With":[142],"representation":[145],"images":[148],"point":[151],"clouds,":[152],"transfer":[153],"can":[155],"be":[156],"more":[157],"accessible,":[158],"enabling":[159],"implementation":[161],"various":[163],"applications":[164],"many":[166],"fields.":[167]},"counts_by_year":[],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
