{"id":"https://openalex.org/W7131127121","doi":"https://doi.org/10.1109/iccvw69036.2025.00090","title":"Drama-X: A Fine-Grained Intent Prediction and Risk Reasoning Benchmark for Driving","display_name":"Drama-X: A Fine-Grained Intent Prediction and Risk Reasoning Benchmark for Driving","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W7131127121","doi":"https://doi.org/10.1109/iccvw69036.2025.00090"},"language":null,"primary_location":{"id":"doi:10.1109/iccvw69036.2025.00090","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00090","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047558204","display_name":"Mihir Godbole","orcid":"https://orcid.org/0009-0009-9166-8332"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mihir Godbole","raw_affiliation_strings":["Texas A&#x0026;M University"],"affiliations":[{"raw_affiliation_string":"Texas A&#x0026;M University","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126605615","display_name":"Xiangbo Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiangbo Gao","raw_affiliation_strings":["Texas A&#x0026;M University"],"affiliations":[{"raw_affiliation_string":"Texas A&#x0026;M University","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015173810","display_name":"Zhengzhong Tu","orcid":"https://orcid.org/0000-0002-7594-2292"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhengzhong Tu","raw_affiliation_strings":["Texas A&#x0026;M University"],"affiliations":[{"raw_affiliation_string":"Texas A&#x0026;M University","institution_ids":["https://openalex.org/I91045830"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5047558204"],"corresponding_institution_ids":["https://openalex.org/I91045830"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.75051008,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"826","last_page":"831"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1891999989748001,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1891999989748001,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.12880000472068787,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.12790000438690186,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7609999775886536},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.5582000017166138},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.542900025844574},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5235000252723694},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.4611999988555908},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.44769999384880066},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.40779998898506165},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.39660000801086426},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.3905999958515167}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7609999775886536},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6855000257492065},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6338000297546387},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.5582000017166138},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5534999966621399},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.542900025844574},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5235000252723694},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.4611999988555908},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.44769999384880066},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.40779998898506165},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.39660000801086426},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.3905999958515167},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.36579999327659607},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.35740000009536743},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.35409998893737793},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.3377000093460083},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3248000144958496},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.31949999928474426},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.3109000027179718},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.2930000126361847},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C9616225","wikidata":"https://www.wikidata.org/wiki/Q3929429","display_name":"Semantic reasoner","level":2,"score":0.2851000130176544},{"id":"https://openalex.org/C57077369","wikidata":"https://www.wikidata.org/wiki/Q7075747","display_name":"Occupancy grid mapping","level":4,"score":0.28439998626708984},{"id":"https://openalex.org/C87833898","wikidata":"https://www.wikidata.org/wiki/Q1060280","display_name":"Advanced driver assistance systems","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.2759999930858612},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.25760000944137573},{"id":"https://openalex.org/C186594467","wikidata":"https://www.wikidata.org/wiki/Q1429176","display_name":"Flooding (psychology)","level":2,"score":0.2572999894618988}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccvw69036.2025.00090","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00090","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4344121515750885,"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2101415982","https://openalex.org/W2115579991","https://openalex.org/W2277195237","https://openalex.org/W2561603333","https://openalex.org/W2771583656","https://openalex.org/W2990711573","https://openalex.org/W2991484432","https://openalex.org/W3035564946","https://openalex.org/W3035574168","https://openalex.org/W3046330049","https://openalex.org/W3156216502","https://openalex.org/W3211740586","https://openalex.org/W4319300501","https://openalex.org/W4390871914","https://openalex.org/W4393153738","https://openalex.org/W4399772534","https://openalex.org/W4399881122","https://openalex.org/W4402727624","https://openalex.org/W4404820176"],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"the":[1,59],"short-term":[2],"motion":[3],"of":[4],"vulnerable":[5],"road":[6],"users":[7],"(VRUs)":[8],"is":[9,141],"critical":[10,143],"for":[11,30,145],"safe":[12],"autonomous":[13,106],"driving,":[14],"especially":[15],"in":[16,44],"high-risk":[17],"urban":[18],"scenarios.":[19],"While":[20],"vision-language":[21],"models":[22],"(VLMs)":[23],"have":[24],"enabled":[25],"open-vocabulary":[26],"perception,":[27],"their":[28],"utility":[29],"fine-grained":[31,55],"intent":[32,42,80,130],"reasoning":[33,110,128],"remains":[34],"underexplored.":[35],"Notably,":[36],"no":[37],"existing":[38],"benchmark":[39,56],"evaluates":[40],"multi-class":[41],"prediction":[43,131],"safety-critical":[45],"situations.":[46],"To":[47],"address":[48],"this":[49],"gap,":[50],"we":[51,93],"introduce":[52],"DRAMA-X,":[53],"a":[54,77,90,96,115,142],"constructed":[57],"from":[58],"DRAMA":[60],"dataset":[61,151],"via":[62],"an":[63,102],"automated":[64],"annotation":[65],"pipeline.":[66],"DRAMA-X":[67],"contains":[68],"5,686":[69],"accident-prone":[70],"frames":[71],"labeled":[72],"with":[73],"object":[74,139],"bounding":[75],"boxes,":[76],"nine-class":[78],"directional":[79],"taxonomy,":[81],"binary":[82],"risk":[83,133],"scores,":[84],"and":[85,120,132,135,150],"expert-generated":[86],"action":[87],"suggestions.":[88],"As":[89],"reference":[91],"baseline,":[92],"propose":[94],"SGG-Intent,":[95],"lightweight,":[97],"training-free":[98],"framework":[99],"that":[100,126,137],"mirrors":[101],"ego":[103],"vehicle":[104,107],"(the":[105],"under":[108],"consideration)'s":[109],"pipeline":[111],"by":[112],"sequentially":[113],"generating":[114],"scene":[116],"graph,":[117],"inferring":[118],"intent,":[119],"assessing":[121],"risk.":[122],"Our":[123,148],"experiments":[124],"demonstrate":[125],"scene-graph-based":[127],"enhances":[129],"assessment,":[134],"reveal":[136],"precise":[138],"localization":[140],"bottleneck":[144],"current":[146],"VLMs.":[147],"code":[149],"are":[152],"available":[153],"at:":[154],"https://github.com/taco-group/DRAMA-X.":[155]},"counts_by_year":[],"updated_date":"2026-02-25T06:17:34.324206","created_date":"2026-02-24T00:00:00"}
