{"id":"https://openalex.org/W6891715243","doi":"https://doi.org/10.4233/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","title":"Visual Detection and Pose Estimation of Vulnerable Road Users for Automated Driving","display_name":"Visual Detection and Pose Estimation of Vulnerable Road Users for Automated Driving","publication_year":2022,"publication_date":"2022-11-16","ids":{"openalex":"https://openalex.org/W6891715243","doi":"https://doi.org/10.4233/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c"},"language":"en","primary_location":{"id":"pmh:oai:tudelft.nl:uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","is_oa":false,"landing_page_url":"http://resolver.tudelft.nl/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"doctoral thesis"},"type":"dissertation","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.4233/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Braun, M.","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Braun, M.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.40230000019073486,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.40230000019073486,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.13519999384880066,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.12399999797344208,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7279999852180481},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6617000102996826},{"id":"https://openalex.org/keywords/advanced-driver-assistance-systems","display_name":"Advanced driver assistance systems","score":0.647599995136261},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6392999887466431},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.5692999958992004},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5612000226974487},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.531000018119812},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.49390000104904175},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.40070000290870667}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7498000264167786},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7279999852180481},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6740999817848206},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6617000102996826},{"id":"https://openalex.org/C87833898","wikidata":"https://www.wikidata.org/wiki/Q1060280","display_name":"Advanced driver assistance systems","level":2,"score":0.647599995136261},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6392999887466431},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.5692999958992004},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5622000098228455},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5612000226974487},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.531000018119812},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.49390000104904175},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.40070000290870667},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.3799000084400177},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3783999979496002},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3723999857902527},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.366100013256073},{"id":"https://openalex.org/C47796450","wikidata":"https://www.wikidata.org/wiki/Q508378","display_name":"Intelligent transportation system","level":2,"score":0.3328999876976013},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33000001311302185},{"id":"https://openalex.org/C2780156472","wikidata":"https://www.wikidata.org/wiki/Q2355550","display_name":"Pedestrian detection","level":3,"score":0.31369999051094055},{"id":"https://openalex.org/C145804949","wikidata":"https://www.wikidata.org/wiki/Q478123","display_name":"Situation awareness","level":2,"score":0.2955000102519989},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.29510000348091125},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C51399673","wikidata":"https://www.wikidata.org/wiki/Q504027","display_name":"Lidar","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2702000141143799},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.2685999870300293},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.25619998574256897},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2500999867916107}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:tudelft.nl:uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","is_oa":false,"landing_page_url":"http://resolver.tudelft.nl/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"doctoral thesis"},{"id":"doi:10.4233/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","is_oa":true,"landing_page_url":"https://doi.org/10.4233/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"thesis"}],"best_oa_location":{"id":"doi:10.4233/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","is_oa":true,"landing_page_url":"https://doi.org/10.4233/uuid:983cffe4-f7ac-47bc-9fdc-8b671008c23c","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"thesis"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.6629877686500549,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0,36,72,772],"thesis":[1,24,135,147,396,527,628,820,832],"addresses":[2],"the":[3,27,74,81,104,115,157,168,228,264,275,294,300,314,319,322,329,339,348,355,391,398,488,501,511,520,529,532,536,544,554,558,569,581,593,596,608,623,627,638,648,666,714,732,748,766,775,790,807,819,824,827,831,835,848,870,877],"topic":[4],"of":[5,21,29,60,83,117,159,240,283,296,313,321,328,341,350,394,407,414,438,459,479,487,514,531,549,565,586,595,610,621,626,640,651,695,717,734,743,798,806,818,826,830,853,869,879],"visual":[6,47,112],"person":[7,128,445,467,480],"detection":[8,129,178,261,304,374,468,504,611,673],"and":[9,70,92,110,130,165,179,208,270,305,352,361,389,411,417,553,562,606,612,674,711,739,757,833,851,858,866],"pose":[10,131,613,699,758,777,812],"estimation.":[11,132],"While":[12],"these":[13,141,515],"tasks":[14,142,633],"are":[15,235,384,493,523,761],"relevant":[16],"for":[17,88,127,140,162,175,219,227,259,268,302,324,426,466,500,568,634,681,692,796,810,838,855,873],"a":[18,50,57,172,183,325,335,404,432,476,602,643,697,721,726,740,781,804],"broad":[19],"range":[20],"applications,":[22],"this":[23,134,395,427,526,690,787],"focuses":[25,150,629],"on":[26,151,156,216,274,557,630,706,786],"domain":[28,37],"intelligent":[30,169],"vehicles":[31,170],"in":[32,76,167,263,338,344,354,420,435,449,469,575,592,618,659,672,720,801,814],"urban":[33,421],"traffic":[34,61,422,470,577],"scenes.":[35,423,471,578],"is":[38,125,189,194,225,256,308,358,367,455,590,615,702,746,752,774],"particularly":[39],"interesting":[40],"due":[41],"to":[42,46,96,102,121,371,386,496,656],"specific":[43],"challenges":[44],"related":[45],"perception":[48],"from":[49,780,823],"moving":[51,433,782],"vehicle.":[52,783],"Accident":[53],"statistics":[54],"show":[55,278,793],"that":[56,237,279,365,683,704],"great":[58,336],"proportion":[59],"fatalities":[62],"affect":[63],"vulnerable":[64],"road":[65],"users":[66],"such":[67,635,718],"as":[68,247,249,498,653,709,765],"pedestrians":[69,351,652,682],"riders.":[71],"motivates":[73],"interest":[75],"reproducing":[77],"or":[78],"even":[79],"surpassing":[80],"capabilities":[82,513],"an":[84,198,209],"attentive":[85],"human":[86,111,811],"driver":[87,89],"assistance":[90],"systems":[91],"fully":[93],"automated":[94,839,874],"driving":[95,875],"improve":[97,663],"safety.":[98],"Deep":[99],"learning":[100,138,343,491,599,857],"contributed":[101],"narrowing":[103],"performance":[105,375,795,837],"gap":[106],"between":[107,604],"computer":[108,345],"visionmethods":[109],"perception.":[113],"Especially":[114],"capability":[116],"convolutional":[118,186,200,728],"neural":[119,187,644,729],"networks":[120],"learn":[122],"powerful":[123],"features":[124],"helpful":[126],"Throughout":[133],"new":[136,160,502,521,698,791],"deep":[137,185,342,490,598,727,856],"methods":[139,234],"will":[143],"be":[144,290],"presented.":[145,190],"The":[146,191,213,252,272,424,472,784],"not":[148,662],"only":[149],"methodical":[152,573,864],"extensions":[153],"but":[154],"also":[155,616],"creation":[158],"datasets":[161,383,463,736],"training,":[163],"evaluation,":[164],"benchmarking":[166,262],"domain.&lt;br/&gt;First,":[171],"novel":[173],"approach":[174],"joint":[176,303],"object":[177,220,260,373,503,550],"orientation":[180,192,306,481,551],"estimation":[181,193,307,614,676,700,813],"with":[182,203,310,508,519,642,670,789,803],"single":[184,722],"network":[188,201,214,645],"implemented":[195],"by":[196,280,376,754],"extending":[197],"existing":[199],"architecture":[202,646],"several":[204],"carefully":[205],"designed":[206],"layers":[207],"appropriate":[210],"loss":[211],"function.":[212],"depends":[215],"external":[217],"proposals":[218,282,297],"candidate":[221],"regions,":[222],"whose":[223],"accuracy":[224],"crucial":[226],"overall":[229],"performance.":[230,664],"Therefore,":[231],"two":[232,715],"proposal":[233],"introduced":[236],"make":[238],"use":[239],"3D":[241],"sensor":[242,285],"data":[243,332,854],"-":[244],"precisely":[245],"stereo":[246],"well":[248],"lidar":[250],"data.":[251],"KITTI":[253,276,356],"dataset,":[254,401],"which":[255,402,589,760],"commonly":[257,582],"used":[258,464,583],"automotive":[265,735],"domain,":[266],"serves":[267],"training":[269,533,868],"evaluation.":[271],"experiments":[273,507,667,785],"dataset":[277,357,387,428,473,522,537,545,751,773,778,788],"combining":[281],"both":[284,632],"modalities,":[286],"high":[287],"recall":[288,605],"can":[289],"achieved":[291],"while":[292],"keeping":[293],"number":[295,349,406,478],"low.":[298],"Furthermore,":[299,525,841],"method":[301,701,792,809],"competitive":[309],"other":[311,418],"state":[312,320,486,805],"art":[315,323,489,808],"approaches.":[316],"It":[317],"outperforms":[318],"test":[326],"scenario":[327],"bicycle":[330],"class.&lt;br/&gt;Big":[331],"has":[333],"had":[334],"share":[337],"success":[340],"vision.":[346],"Still,":[347],"riders":[353,419],"rather":[359],"limited":[360],"previous":[362,509,828],"works":[363],"suggest":[364],"there":[366],"significant":[368],"further":[369,654],"potential":[370,860],"increase":[372],"utilizing":[377],"bigger":[378],"datasets.":[379],"Regarding":[380],"benchmarking,":[381],"small":[382],"prone":[385],"bias":[388],"overfitting.&lt;br/&gt;Therefore,":[390],"second":[392],"part":[393,625],"introduces":[397],"EuroCity":[399,453,749,767],"Persons":[400,454,750,768],"provides":[403],"large":[405,477],"highly":[408,684],"diverse,":[409],"accurate,":[410],"detailed":[412],"annotations":[413,482],"pedestrians,":[415],"cyclists,":[416],"images":[425,756],"were":[429],"collected":[430],"onboard":[431],"vehicle":[434],"31":[436],"cities":[437],"12":[439],"European":[440],"countries.":[441],"With":[442],"over":[443,450],"238200":[444],"instances":[446],"manually":[447],"labeled":[448],"47300":[451],"images,":[452],"nearly":[456],"one":[457],"order":[458],"magnitude":[460],"larger":[461],"than":[462],"previously":[465],"furthermore":[474],"contains":[475],"(over":[483],"211200).":[484],"Four":[485],"approaches":[492],"thoroughly":[494],"optimized":[495],"serve":[497],"baselines":[499],"benchmark.":[505],"In":[506],"datasets,":[510],"generalization":[512],"detectors":[516],"when":[517],"trained":[518],"analyzed.":[524],"studies":[528],"effect":[530],"set":[534],"size,":[535],"diversity":[538],"(day-":[539],"vs.":[540],"night-time,":[541],"geographical":[542],"region),":[543],"detail":[546],"(i.e.,":[547],"availability":[548,733],"information),":[552],"annotation":[555],"quality":[556],"detector":[559,571],"performance.&lt;br/&gt;The":[560],"qualitative":[561],"quantitative":[563],"analysis":[564],"error":[566],"sources":[567],"best-performing":[570],"reveals":[572],"weaknesses":[574],"dense":[576,619],"For":[579],"these,":[580],"(greedy)":[584],"implementation":[585],"non-maximum":[587],"suppression,":[588],"needed":[591],"post-processing":[594],"analyzed":[597],"methods,":[600],"poses":[601,716,738,797],"tradeoff":[603],"precision.&lt;br/&gt;As":[607],"robustness":[609],"important":[617],"groups":[620,660],"persons,":[622],"third":[624],"improving":[631],"scenarios.":[636],"Learning":[637],"task":[639],"non-maximumsuppression":[641],"incorporating":[647],"head":[649,678],"boxes":[650],"attributes":[655],"discriminate":[657],"persons":[658,696],"does":[661],"Yet,":[665],"reveal":[668],"issues":[669],"ambiguities":[671],"attribute":[675],"(e.g.":[677],"box":[679],"estimation)":[680],"overlap":[685],"each":[686],"other.":[687],"To":[688],"solve":[689],"ambiguity":[691],"pairwise":[693,707],"constellations":[694],"proposed":[703],"relies":[705],"detections":[708],"input":[710],"jointly":[712],"estimates":[713],"pairs":[719,800],"forward":[723],"pass":[724],"within":[725],"network.":[730],"As":[731],"providing":[737],"fair":[741],"amount":[742],"crowded":[744],"scenes":[745],"limited,":[747],"extended":[753],"additional":[755],"annotations,":[759],"made":[762],"publicly":[763],"available":[764],"Dense":[769],"Pose":[770],"dataset.":[771],"largest":[776],"recorded":[779],"improved":[794],"pedestrian":[799],"comparison":[802],"crowds.&lt;br/&gt;The":[815],"final":[816],"chapter":[817],"draws":[821],"conclusions":[822],"content":[825],"chapters":[829],"discusses":[834],"required":[836],"driving.":[840],"it":[842],"reasons":[843],"about":[844],"efficiency":[845],"aspects":[846],"regarding":[847,863],"collection,":[849],"annotation,":[850],"usage":[852],"presents":[859],"future":[861],"work":[862],"improvements":[865],"end-to-end":[867],"functional":[871],"chain":[872],"including":[876],"integration":[878],"multiple":[880],"sensors.":[881]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
