{"id":"https://openalex.org/W3176270532","doi":"https://doi.org/10.1145/3457682.3457747","title":"Semantically Enhanced Multi-scale Feature Pyramid Fusion for Pedestrian Detection","display_name":"Semantically Enhanced Multi-scale Feature Pyramid Fusion for Pedestrian Detection","publication_year":2021,"publication_date":"2021-02-26","ids":{"openalex":"https://openalex.org/W3176270532","doi":"https://doi.org/10.1145/3457682.3457747","mag":"3176270532"},"language":"en","primary_location":{"id":"doi:10.1145/3457682.3457747","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3457682.3457747","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 13th International Conference on Machine Learning and Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100384655","display_name":"Jun Wang","orcid":"https://orcid.org/0000-0001-9223-2615"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jun Wang","raw_affiliation_strings":["University of Science and Technology Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101989915","display_name":"Chao Zhu","orcid":"https://orcid.org/0000-0001-5486-7492"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Zhu","raw_affiliation_strings":["University of Science and Technology Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100384655"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":0.1921,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.47704248,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"423","last_page":"431"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pedestrian-detection","display_name":"Pedestrian detection","score":0.902439296245575},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7949842214584351},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.7402420043945312},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.6648508310317993},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.6185984015464783},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.61543208360672},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6008914113044739},{"id":"https://openalex.org/keywords/pedestrian","display_name":"Pedestrian","score":0.5876824855804443},{"id":"https://openalex.org/keywords/semantic-feature","display_name":"Semantic feature","score":0.5675759315490723},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5555737018585205},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5092200040817261},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.47626492381095886},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.45190751552581787},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4128498435020447},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.38800913095474243},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11014288663864136},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06466630101203918}],"concepts":[{"id":"https://openalex.org/C2780156472","wikidata":"https://www.wikidata.org/wiki/Q2355550","display_name":"Pedestrian detection","level":3,"score":0.902439296245575},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7949842214584351},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.7402420043945312},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.6648508310317993},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.6185984015464783},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.61543208360672},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6008914113044739},{"id":"https://openalex.org/C2777113093","wikidata":"https://www.wikidata.org/wiki/Q221488","display_name":"Pedestrian","level":2,"score":0.5876824855804443},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.5675759315490723},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5555737018585205},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5092200040817261},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.47626492381095886},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.45190751552581787},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4128498435020447},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.38800913095474243},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11014288663864136},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06466630101203918},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3457682.3457747","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3457682.3457747","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 13th International Conference on Machine Learning and Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7900000214576721,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[{"id":"https://openalex.org/G7993496336","display_name":null,"funder_award_id":"61703039, 62072032","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W2031454541","https://openalex.org/W2108598243","https://openalex.org/W2193145675","https://openalex.org/W2579985080","https://openalex.org/W2883363148","https://openalex.org/W2895451584","https://openalex.org/W2896540732","https://openalex.org/W2899607431","https://openalex.org/W2962850098","https://openalex.org/W2963315052","https://openalex.org/W2963381188","https://openalex.org/W2963681621","https://openalex.org/W2963903399","https://openalex.org/W3106250896"],"related_works":["https://openalex.org/W2972620127","https://openalex.org/W2981141433","https://openalex.org/W2802018156","https://openalex.org/W4313315626","https://openalex.org/W2101531944","https://openalex.org/W2348780717","https://openalex.org/W2922437833","https://openalex.org/W4312696271","https://openalex.org/W4223892596","https://openalex.org/W2933098581"],"abstract_inverted_index":{"Detecting":[0],"multi-scale":[1,44,52,67,78,82,150,161,197],"pedestrians":[2],"(especially":[3],"small":[4],"scale":[5],"ones)":[6],"is":[7,36],"one":[8],"of":[9,39,43,89,160,193],"the":[10,114,120,138,178,194],"most":[11,20],"challenging":[12],"problems":[13],"in":[14,29,50,61,137],"computer":[15],"vision":[16],"community.":[17],"At":[18],"present,":[19],"existing":[21],"pedestrian":[22,83,139,198],"detectors":[23],"only":[24],"adopt":[25],"single-scale":[26],"feature":[27,45,68,79,117,151,162],"map":[28],"their":[30],"backbone":[31],"network":[32],"for":[33,81],"detection,":[34],"which":[35],"not":[37],"capable":[38],"fully":[40],"taking":[41],"advantages":[42,159],"information,":[46,129],"and":[47,76,99,164,181],"thus":[48],"resulting":[49],"unsatisfactory":[51],"detection":[53,144,171],"performance.":[54,145],"To":[55],"address":[56],"this":[57,62],"issue,":[58],"we":[59],"propose":[60],"paper":[63],"a":[64],"semantically":[65],"enhanced":[66,124],"pyramid":[69],"fusion":[70],"method":[71,87,186],"that":[72,131],"can":[73,133],"effectively":[74],"extract":[75],"integrate":[77],"maps":[80,152],"detection.":[84,199],"The":[85],"proposed":[86,185],"consists":[88],"two":[90],"main":[91],"components:":[92],"1)":[93],"Trapezoidal":[94],"Path":[95],"Augmented":[96],"Module":[97,104],"(TPAM)":[98],"2)":[100],"Multi-scale":[101],"Feature":[102],"Fusion":[103],"(MFFM).":[105],"TPAM":[106,155],"aims":[107,147],"at":[108,148],"extracting":[109],"higher-level":[110,116,127],"semantic":[111,128],"features":[112,122],"by":[113,169],"additional":[115],"layers,":[118],"where":[119],"produced":[121],"are":[123],"with":[125],"supplementary":[126],"so":[130],"they":[132],"focus":[134],"more":[135],"accurately":[136],"area,":[140],"leading":[141],"to":[142,156],"improved":[143],"MFFM":[146],"integrating":[149],"coming":[153],"from":[154],"further":[157],"take":[158],"information":[163],"reduce":[165],"computational":[166],"redundancy":[167],"caused":[168],"multiple":[170],"heads.":[172],"By":[173],"extensive":[174],"experimental":[175],"evaluations":[176],"on":[177,196],"popular":[179],"CityPersons":[180],"Caltech":[182],"benchmarks,":[183],"our":[184],"achieves":[187],"superior":[188],"performances":[189],"than":[190],"previous":[191],"state":[192],"arts":[195]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
