{"id":"https://openalex.org/W4413018004","doi":"https://doi.org/10.1109/iv64158.2025.11097349","title":"Pedestrian Intention Prediction via Vision-Language Foundation Models","display_name":"Pedestrian Intention Prediction via Vision-Language Foundation Models","publication_year":2025,"publication_date":"2025-06-22","ids":{"openalex":"https://openalex.org/W4413018004","doi":"https://doi.org/10.1109/iv64158.2025.11097349"},"language":"en","primary_location":{"id":"doi:10.1109/iv64158.2025.11097349","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iv64158.2025.11097349","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Intelligent Vehicles Symposium (IV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://discovery.ucl.ac.uk/10214825/1/2507.04141v1.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026516871","display_name":"Mohsen Azarmi","orcid":"https://orcid.org/0000-0003-0737-9204"},"institutions":[{"id":"https://openalex.org/I3144123604","display_name":"Department for Transport","ror":"https://ror.org/010mf0m52","country_code":"GB","type":"government","lineage":["https://openalex.org/I2802373619","https://openalex.org/I3144123604"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Mohsen Azarmi","raw_affiliation_strings":["Institute for Transport Studies, University of Leeds,Faculty of Environment, Computer Vision and Machine Learning Group,United Kingdom,LS2 9JT"],"affiliations":[{"raw_affiliation_string":"Institute for Transport Studies, University of Leeds,Faculty of Environment, Computer Vision and Machine Learning Group,United Kingdom,LS2 9JT","institution_ids":["https://openalex.org/I3144123604"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067789332","display_name":"Mahdi Rezaei","orcid":"https://orcid.org/0000-0003-3892-421X"},"institutions":[{"id":"https://openalex.org/I3144123604","display_name":"Department for Transport","ror":"https://ror.org/010mf0m52","country_code":"GB","type":"government","lineage":["https://openalex.org/I2802373619","https://openalex.org/I3144123604"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Mahdi Rezaei","raw_affiliation_strings":["Institute for Transport Studies, University of Leeds,Faculty of Environment, Computer Vision and Machine Learning Group,United Kingdom,LS2 9JT"],"affiliations":[{"raw_affiliation_string":"Institute for Transport Studies, University of Leeds,Faculty of Environment, Computer Vision and Machine Learning Group,United Kingdom,LS2 9JT","institution_ids":["https://openalex.org/I3144123604"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050061175","display_name":"He Wang","orcid":"https://orcid.org/0000-0002-2281-5679"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"He Wang","raw_affiliation_strings":["University College London,AI Centre,Department of Computer Science,London,United Kingdom,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,AI Centre,Department of Computer Science,London,United Kingdom,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5026516871"],"corresponding_institution_ids":["https://openalex.org/I3144123604"],"apc_list":null,"apc_paid":null,"fwci":1.1783,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.81315233,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1899","last_page":"1904"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13282","display_name":"Automated Road and Building Extraction","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pedestrian","display_name":"Pedestrian","score":0.8325316905975342},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.694767415523529},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6276078224182129},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5149567723274231},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.44171464443206787},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33275747299194336},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3221553862094879},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.20854654908180237},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1724606156349182},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.11457017064094543}],"concepts":[{"id":"https://openalex.org/C2777113093","wikidata":"https://www.wikidata.org/wiki/Q221488","display_name":"Pedestrian","level":2,"score":0.8325316905975342},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.694767415523529},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6276078224182129},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5149567723274231},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44171464443206787},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33275747299194336},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3221553862094879},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.20854654908180237},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1724606156349182},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.11457017064094543},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iv64158.2025.11097349","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iv64158.2025.11097349","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Intelligent Vehicles Symposium (IV)","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.whiterose.ac.uk:229640","is_oa":false,"landing_page_url":"https://orcid.org/0000-0003-3892-421X>","pdf_url":null,"source":{"id":"https://openalex.org/S4306400854","display_name":"White Rose Research Online (University of Leeds, The University of Sheffield, University of York)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2800616092","host_organization_name":"White Rose University Consortium","host_organization_lineage":["https://openalex.org/I2800616092"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"NonPeerReviewed"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10214825","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10214825/","pdf_url":"https://discovery.ucl.ac.uk/10214825/1/2507.04141v1.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"In:  Proceedings of the 2025 IEEE INTELLIGENT VEHICLES SYMPOSIUM, IV.  (pp. pp. 1899-1904).  IEEE: Cluj-Napoca, Romania. (2025)","raw_type":"Proceedings paper"}],"best_oa_location":{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10214825","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10214825/","pdf_url":"https://discovery.ucl.ac.uk/10214825/1/2507.04141v1.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"In:  Proceedings of the 2025 IEEE INTELLIGENT VEHICLES SYMPOSIUM, IV.  (pp. pp. 1899-1904).  IEEE: Cluj-Napoca, Romania. (2025)","raw_type":"Proceedings paper"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4413018004.pdf"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W2012210378","https://openalex.org/W2592496287","https://openalex.org/W2883770893","https://openalex.org/W2963697717","https://openalex.org/W2968684599","https://openalex.org/W2991484432","https://openalex.org/W3008700642","https://openalex.org/W3110317294","https://openalex.org/W3119170582","https://openalex.org/W3119361198","https://openalex.org/W3182910206","https://openalex.org/W3195951281","https://openalex.org/W3209986245","https://openalex.org/W3214126613","https://openalex.org/W4285105848","https://openalex.org/W4285819379","https://openalex.org/W4308244910","https://openalex.org/W4365447993","https://openalex.org/W4366850747","https://openalex.org/W4385325527","https://openalex.org/W4386590862","https://openalex.org/W4389849804","https://openalex.org/W4396982312","https://openalex.org/W4398184793","https://openalex.org/W4399837667","https://openalex.org/W4400601342","https://openalex.org/W4401042136","https://openalex.org/W4402350970","https://openalex.org/W4402916392","https://openalex.org/W4403663158","https://openalex.org/W4404724663","https://openalex.org/W4410706709","https://openalex.org/W4410949610","https://openalex.org/W6776598532","https://openalex.org/W6846556436","https://openalex.org/W6851950068","https://openalex.org/W6855007681","https://openalex.org/W6869594802","https://openalex.org/W6870183580","https://openalex.org/W6873162891"],"related_works":["https://openalex.org/W2392100589","https://openalex.org/W2512789322","https://openalex.org/W3122828758","https://openalex.org/W2101960027","https://openalex.org/W4205958986","https://openalex.org/W2197846993","https://openalex.org/W49697837","https://openalex.org/W2586575957","https://openalex.org/W2170799233","https://openalex.org/W4320736889"],"abstract_inverted_index":{"Prediction":[0],"of":[1,15,33,128],"pedestrian":[2,40],"crossing":[3,16,41],"intention":[4,17,74],"is":[5],"a":[6],"critical":[7],"function":[8],"in":[9,73],"autonomous":[10,142],"vehicles.":[11],"Conventional":[12],"vision-based":[13,133],"methods":[14],"prediction":[18,102],"often":[19],"struggle":[20],"with":[21],"generalizability,":[22],"context":[23],"understanding,":[24],"and":[25,62,84,96,138],"causal":[26],"reasoning.":[27],"This":[28],"study":[29],"explores":[30],"the":[31,101,125],"potential":[32],"vision-language":[34],"foundation":[35],"models":[36],"(VLFMs)":[37],"for":[38,141],"predicting":[39],"intentions":[42],"by":[43],"integrating":[44],"multimodal":[45],"data":[46],"through":[47],"hierarchical":[48],"prompt":[49,114],"templates.":[50],"The":[51],"methodology":[52],"incorporates":[53],"contextual":[54,139],"information,":[55],"including":[56],"visual":[57],"frames,":[58],"physical":[59],"cues":[60],"observations,":[61],"ego-vehicle":[63],"dynamics,":[64],"into":[65],"systematically":[66],"refined":[67],"prompts":[68,98,109],"to":[69,105,131],"guide":[70],"VLFMs":[71,129],"effectively":[72],"prediction.":[75],"Experiments":[76],"were":[77],"conducted":[78],"on":[79],"three":[80],"common":[81],"datasets\u2014JAAD,":[82],"PIE,":[83],"FU-PIP.":[85],"Results":[86],"demonstrate":[87],"that":[88],"incorporating":[89],"vehicle":[90],"speed,":[91],"its":[92],"variations":[93],"over":[94],"time,":[95],"time-conscious":[97],"significantly":[99],"enhances":[100],"accuracy":[103,120],"up":[104],"19.8%.":[106],"Additionally,":[107],"optimised":[108],"generated":[110],"via":[111],"an":[112],"automatic":[113],"engineering":[115],"framework":[116],"yielded":[117],"12.5%":[118],"further":[119],"gains.":[121],"These":[122],"findings":[123],"highlight":[124],"superior":[126],"performance":[127],"compared":[130],"conventional":[132],"models,":[134],"offering":[135],"enhanced":[136],"generalisation":[137],"understanding":[140],"driving":[143],"applications.":[144]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
