{"id":"https://openalex.org/W3015750515","doi":"https://doi.org/10.1109/icassp40776.2020.9054009","title":"Object Detection with Color and Depth Images with Multi-Reduced Region Proposal Network and Multi-Pooling","display_name":"Object Detection with Color and Depth Images with Multi-Reduced Region Proposal Network and Multi-Pooling","publication_year":2020,"publication_date":"2020-04-09","ids":{"openalex":"https://openalex.org/W3015750515","doi":"https://doi.org/10.1109/icassp40776.2020.9054009","mag":"3015750515"},"language":"en","primary_location":{"id":"doi:10.1109/icassp40776.2020.9054009","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9054009","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003059876","display_name":"Jiou-Ai Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Jiou-Ai Lin","raw_affiliation_strings":["Department of Computer Science, National Tsing Hua University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064665970","display_name":"Ching Te Chiu","orcid":null},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Ching - Te Chiu","raw_affiliation_strings":["Department of Computer Science, National Tsing Hua University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065063996","display_name":"Yen-Yu Cheng","orcid":"https://orcid.org/0000-0002-5267-6980"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yen-Yu Cheng","raw_affiliation_strings":["Department of Computer Science, National Tsing Hua University, Hsinchu, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National Tsing Hua University, Hsinchu, Taiwan","institution_ids":["https://openalex.org/I25846049"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5003059876"],"corresponding_institution_ids":["https://openalex.org/I25846049"],"apc_list":null,"apc_paid":null,"fwci":0.2931,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.5459266,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1618","last_page":"1622"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.7927395105361938},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.779836893081665},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.7415749430656433},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7297242283821106},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6761032342910767},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5479221343994141},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5014925003051758},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.47817856073379517},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4514273405075073},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.43491312861442566},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3912423849105835},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08786198496818542}],"concepts":[{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.7927395105361938},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.779836893081665},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.7415749430656433},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7297242283821106},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6761032342910767},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5479221343994141},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5014925003051758},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.47817856073379517},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4514273405075073},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.43491312861442566},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3912423849105835},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08786198496818542},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp40776.2020.9054009","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9054009","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.5600000023841858}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1686810756","https://openalex.org/W1923184257","https://openalex.org/W2031489346","https://openalex.org/W2108598243","https://openalex.org/W2125389748","https://openalex.org/W2155893237","https://openalex.org/W2229637417","https://openalex.org/W2463032559","https://openalex.org/W2598666589","https://openalex.org/W2613718673","https://openalex.org/W2780829839","https://openalex.org/W2788333383","https://openalex.org/W2895359088","https://openalex.org/W2962888833","https://openalex.org/W2963000224","https://openalex.org/W2963446712","https://openalex.org/W2969649120","https://openalex.org/W2980698950","https://openalex.org/W3106250896","https://openalex.org/W6620707391","https://openalex.org/W6637373629","https://openalex.org/W6678583879","https://openalex.org/W6725543821","https://openalex.org/W6748662280","https://openalex.org/W6785652829"],"related_works":["https://openalex.org/W2953234277","https://openalex.org/W2626256601","https://openalex.org/W147410782","https://openalex.org/W2900413183","https://openalex.org/W2949096641","https://openalex.org/W2970686063","https://openalex.org/W4320729701","https://openalex.org/W3210378990","https://openalex.org/W3034745255","https://openalex.org/W4254103348"],"abstract_inverted_index":{"Object":[0],"detection":[1,51,74],"technology":[2],"has":[3],"received":[4],"increasing":[5],"research":[6],"attention":[7],"with":[8,40,106,134,152],"recent":[9],"developments":[10],"in":[11,16,34],"automation":[12],"technology.":[13],"Most":[14],"studies":[15],"this":[17,35],"field,":[18],"however,":[19],"use":[20,31,38],"RGB":[21,42],"images":[22,39],"as":[23,46,81],"input":[24,47],"to":[25,48,78,91,126,146],"deep-learning":[26],"classifiers,":[27],"and":[28,43,66,71,112],"they":[29],"rarely":[30],"depth":[32,44,80,117],"information.So,":[33],"paper,":[36],"we":[37,67,83,156],"both":[41],"information":[45,118],"an":[49],"object":[50,73],"network.":[52],"We":[53,97],"base":[54],"our":[55],"network":[56],"on":[57,94],"the":[58,86,100,120,130,138,142,159,177],"Faster":[59],"R-CNN":[60],"proposed":[61],"by":[62,122],"Shih":[63],"et":[64],"al.,":[65],"develop":[68],"a":[69],"fast":[70],"accurate":[72],"architecture.":[75],"In":[76],"addition":[77],"adding":[79],"input,":[82],"also":[84,98],"adjust":[85],"type":[87],"of":[88,102,114,161],"anchor":[89,139],"boxes":[90,140],"improve":[92],"performance":[93],"some":[95],"objects.":[96],"discuss":[99],"impact":[101],"pooling":[103],"training":[104],"data":[105],"multiple":[107],"region":[108],"proposal":[109],"networks":[110],"(RPN)":[111],"regions":[113],"interest":[115],"(ROI).Adding":[116],"improved":[119,141],"mAP":[121,143],"8.15%,":[123],"from":[124,144],"36.86%":[125],"45.01%,":[127],"when":[128],"using":[129],"SUN":[131],"RGB-D":[132],"dataset":[133],"10":[135],"classes.":[136],"Optimizing":[137],"45.01%":[145],"45.88%.":[147],"After":[148],"testing":[149],"various":[150],"architectures":[151],"different":[153],"reduced":[154],"RPNs,":[155],"find":[157],"that":[158],"model":[160],"1RRPN-2ROIP":[162],"performs":[163],"best.":[164],"The":[165],"running":[166],"time":[167],"is":[168,172],"0.123":[169],"s,":[170],"which":[171],"1.8":[173],"times":[174],"faster":[175],"than":[176],"3D-SSD":[178],"model.":[179]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
