{"id":"https://openalex.org/W7124990955","doi":"https://doi.org/10.1109/cbmi66578.2025.11339297","title":"FPN-Based Multi-Scale Feature Fusion for Robust 3D Pedestrian Detection in Crowded Scenes","display_name":"FPN-Based Multi-Scale Feature Fusion for Robust 3D Pedestrian Detection in Crowded Scenes","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W7124990955","doi":"https://doi.org/10.1109/cbmi66578.2025.11339297"},"language":null,"primary_location":{"id":"doi:10.1109/cbmi66578.2025.11339297","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbmi66578.2025.11339297","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Content-Based Multimedia Indexing (CBMI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050147976","display_name":"Kiyotaka Matsue","orcid":"https://orcid.org/0000-0002-1621-798X"},"institutions":[{"id":"https://openalex.org/I1292669757","display_name":"Toshiba (Japan)","ror":"https://ror.org/0326v3z14","country_code":"JP","type":"company","lineage":["https://openalex.org/I1292669757"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Kiyotaka Matsue","raw_affiliation_strings":["Infrastructure Systems R&#x0026;D Center, Toshiba Corporation,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"Infrastructure Systems R&#x0026;D Center, Toshiba Corporation,Tokyo,Japan","institution_ids":["https://openalex.org/I1292669757"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093478913","display_name":"Kenta Umene","orcid":null},"institutions":[{"id":"https://openalex.org/I1292669757","display_name":"Toshiba (Japan)","ror":"https://ror.org/0326v3z14","country_code":"JP","type":"company","lineage":["https://openalex.org/I1292669757"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kenta Umene","raw_affiliation_strings":["Infrastructure Systems R&#x0026;D Center, Toshiba Corporation,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"Infrastructure Systems R&#x0026;D Center, Toshiba Corporation,Tokyo,Japan","institution_ids":["https://openalex.org/I1292669757"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123370838","display_name":"Nghia Dao","orcid":null},"institutions":[{"id":"https://openalex.org/I1292669757","display_name":"Toshiba (Japan)","ror":"https://ror.org/0326v3z14","country_code":"JP","type":"company","lineage":["https://openalex.org/I1292669757"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Nghia Dao","raw_affiliation_strings":["Toshiba Software Development (Vietnam),Core Technology Dept.,Hanoi,Vietnam"],"affiliations":[{"raw_affiliation_string":"Toshiba Software Development (Vietnam),Core Technology Dept.,Hanoi,Vietnam","institution_ids":["https://openalex.org/I1292669757"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123449167","display_name":"Hieu Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I1292669757","display_name":"Toshiba (Japan)","ror":"https://ror.org/0326v3z14","country_code":"JP","type":"company","lineage":["https://openalex.org/I1292669757"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hieu Nguyen","raw_affiliation_strings":["Toshiba Software Development (Vietnam),Core Technology Dept.,Hanoi,Vietnam"],"affiliations":[{"raw_affiliation_string":"Toshiba Software Development (Vietnam),Core Technology Dept.,Hanoi,Vietnam","institution_ids":["https://openalex.org/I1292669757"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060053741","display_name":"Manh Thuong Phan","orcid":null},"institutions":[{"id":"https://openalex.org/I1292669757","display_name":"Toshiba (Japan)","ror":"https://ror.org/0326v3z14","country_code":"JP","type":"company","lineage":["https://openalex.org/I1292669757"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Manh Phan","raw_affiliation_strings":["Toshiba Software Development (Vietnam),Core Technology Dept.,Hanoi,Vietnam"],"affiliations":[{"raw_affiliation_string":"Toshiba Software Development (Vietnam),Core Technology Dept.,Hanoi,Vietnam","institution_ids":["https://openalex.org/I1292669757"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5050147976"],"corresponding_institution_ids":["https://openalex.org/I1292669757"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.70266779,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8984000086784363,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8984000086784363,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.014100000262260437,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11606","display_name":"Infrastructure Maintenance and Monitoring","score":0.008899999782443047,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pedestrian-detection","display_name":"Pedestrian detection","score":0.8637999892234802},{"id":"https://openalex.org/keywords/pedestrian","display_name":"Pedestrian","score":0.7731000185012817},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.7056999802589417},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.6298999786376953},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5777999758720398},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.5713000297546387},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4832000136375427},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43230000138282776},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.3756999969482422}],"concepts":[{"id":"https://openalex.org/C2780156472","wikidata":"https://www.wikidata.org/wiki/Q2355550","display_name":"Pedestrian detection","level":3,"score":0.8637999892234802},{"id":"https://openalex.org/C2777113093","wikidata":"https://www.wikidata.org/wiki/Q221488","display_name":"Pedestrian","level":2,"score":0.7731000185012817},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7501999735832214},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7120000123977661},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.7056999802589417},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6771000027656555},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.6298999786376953},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5777999758720398},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.5713000297546387},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4832000136375427},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43230000138282776},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3756999969482422},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3752000033855438},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3659999966621399},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.36149999499320984},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.323199987411499},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.30959999561309814},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C88796919","wikidata":"https://www.wikidata.org/wiki/Q1142907","display_name":"Backbone network","level":2,"score":0.29260000586509705},{"id":"https://openalex.org/C126422989","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature detection (computer vision)","level":4,"score":0.2775000035762787},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2639999985694885},{"id":"https://openalex.org/C71681937","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object-class detection","level":5,"score":0.2621999979019165},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cbmi66578.2025.11339297","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbmi66578.2025.11339297","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Content-Based Multimedia Indexing (CBMI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8378028869628906,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W2565639579","https://openalex.org/W2897529137","https://openalex.org/W2967324759","https://openalex.org/W2968296999","https://openalex.org/W3034429258","https://openalex.org/W3035574168","https://openalex.org/W3118341329","https://openalex.org/W3167095230","https://openalex.org/W4225847518","https://openalex.org/W4312743914","https://openalex.org/W4383066393"],"related_works":[],"abstract_inverted_index":{"Pedestrian":[0],"detection":[1,44,88,110,145],"in":[2,13,45,66,106,123,146,150],"crowded":[3],"environments":[4],"is":[5,92],"a":[6,26],"critical":[7],"challenge":[8],"for":[9],"intelligent":[10],"systems,":[11],"particularly":[12,122,149],"urban":[14,151],"areas":[15],"where":[16,125],"safety":[17],"and":[18,35,78,102],"operational":[19],"efficiency":[20],"are":[21],"paramount.":[22],"This":[23,139],"paper":[24],"presents":[25],"novel":[27],"approach":[28,113],"that":[29,98],"leverages":[30],"3D":[31,101,108,119],"point":[32],"cloud":[33],"data":[34],"integrates":[36,99],"Feature":[37],"Pyramid":[38],"Networks":[39],"(FPN)":[40],"to":[41,51,63,142],"enhance":[42],"pedestrian":[43,144,155],"dense":[46],"crowds.":[47],"We":[48],"propose":[49],"modifications":[50],"the":[52,56,93,107,115],"2D":[53,103],"backbone":[54,104],"of":[55,96,117],"CenterPoint":[57],"network,":[58],"generating":[59],"larger":[60],"heatmap":[61],"sizes":[62],"improve":[64],"differentiation":[65],"closely":[67],"packed":[68],"scenes.":[69],"Additionally,":[70],"by":[71],"combining":[72],"multi-scale":[73],"features":[74,105],"from":[75],"both":[76,100],"high-":[77],"low-resolution":[79],"layers":[80],"using":[81],"FPN,":[82],"our":[83],"method":[84],"achieves":[85],"more":[86],"robust":[87],"performance.":[89],"Notably,":[90],"this":[91],"first":[94],"application":[95],"FPN":[97],"object":[109,120],"field.":[111],"Our":[112],"enhances":[114],"performance":[116],"LiDAR-based":[118],"detection,":[121],"conditions":[124],"camera-based":[126],"methods":[127],"struggle,":[128],"such":[129],"as":[130],"occlusion":[131],"under":[132],"extremely":[133],"strong":[134],"or":[135],"weak":[136],"lighting":[137],"conditions.":[138],"work":[140],"contributes":[141],"advancing":[143],"multimedia":[147],"environments,":[148],"spaces":[152],"with":[153],"high":[154],"density.":[156]},"counts_by_year":[],"updated_date":"2026-01-22T23:29:09.771500","created_date":"2026-01-21T00:00:00"}
