{"id":"https://openalex.org/W4417113916","doi":"https://doi.org/10.1145/3769748.3773353","title":"Integrating Multimodal Geo-Semantic Contexts for Traffic Prediction","display_name":"Integrating Multimodal Geo-Semantic Contexts for Traffic Prediction","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W4417113916","doi":"https://doi.org/10.1145/3769748.3773353"},"language":null,"primary_location":{"id":"doi:10.1145/3769748.3773353","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3769748.3773353","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3769748.3773353","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Multimedia in Asia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3769748.3773353","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000354904","display_name":"Shuntaro Masuda","orcid":"https://orcid.org/0009-0008-2490-9557"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Shuntaro Masuda","raw_affiliation_strings":["The University of Tokyo, Tokyo, Japan"],"raw_orcid":"https://orcid.org/0009-0008-2490-9557","affiliations":[{"raw_affiliation_string":"The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002302620","display_name":"Fumiya Matsuno","orcid":"https://orcid.org/0009-0007-0594-5600"},"institutions":[{"id":"https://openalex.org/I4210139992","display_name":"MDS Associates (United States)","ror":"https://ror.org/047bhz389","country_code":"US","type":"company","lineage":["https://openalex.org/I4210139992"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fumiya Matsuno","raw_affiliation_strings":["MD Inc., Tokyo, Japan"],"raw_orcid":"https://orcid.org/0009-0007-0594-5600","affiliations":[{"raw_affiliation_string":"MD Inc., Tokyo, Japan","institution_ids":["https://openalex.org/I4210139992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120753893","display_name":"Itsuki Hirai","orcid":"https://orcid.org/0009-0004-4536-4446"},"institutions":[{"id":"https://openalex.org/I4210139992","display_name":"MDS Associates (United States)","ror":"https://ror.org/047bhz389","country_code":"US","type":"company","lineage":["https://openalex.org/I4210139992"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Itsuki Hirai","raw_affiliation_strings":["MD Inc., Tokyo, Japan"],"raw_orcid":"https://orcid.org/0009-0004-4536-4446","affiliations":[{"raw_affiliation_string":"MD Inc., Tokyo, Japan","institution_ids":["https://openalex.org/I4210139992"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048624196","display_name":"Toshihiko Yamasaki","orcid":"https://orcid.org/0000-0002-1784-2314"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Toshihiko Yamasaki","raw_affiliation_strings":["The University of Tokyo, Tokyo, Japan"],"raw_orcid":"https://orcid.org/0000-0002-1784-2314","affiliations":[{"raw_affiliation_string":"The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5000354904"],"corresponding_institution_ids":["https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.39648252,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.4927000105381012,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.4927000105381012,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13282","display_name":"Automated Road and Building Extraction","score":0.43849998712539673,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.010999999940395355,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6276999711990356},{"id":"https://openalex.org/keywords/satellite-imagery","display_name":"Satellite imagery","score":0.5034000277519226},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.49549999833106995},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.47369998693466187},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.43459999561309814},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.4075999855995178},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.3767000138759613},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.359499990940094},{"id":"https://openalex.org/keywords/structured-prediction","display_name":"Structured prediction","score":0.35760000348091125}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6983000040054321},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6276999711990356},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5393000245094299},{"id":"https://openalex.org/C2778102629","wikidata":"https://www.wikidata.org/wiki/Q725252","display_name":"Satellite imagery","level":2,"score":0.5034000277519226},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.49549999833106995},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.47369998693466187},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4487999975681305},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.43459999561309814},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.4075999855995178},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.3767000138759613},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.359499990940094},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.35760000348091125},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.35409998893737793},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.3452000021934509},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3345000147819519},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.33149999380111694},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.3310000002384186},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.32839998602867126},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.32019999623298645},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.2989000082015991},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.2680000066757202},{"id":"https://openalex.org/C20556612","wikidata":"https://www.wikidata.org/wiki/Q4469374","display_name":"Volume (thermodynamics)","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3769748.3773353","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3769748.3773353","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3769748.3773353","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Multimedia in Asia","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3769748.3773353","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3769748.3773353","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3769748.3773353","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 7th ACM International Conference on Multimedia in Asia","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4417113916.pdf","grobid_xml":"https://content.openalex.org/works/W4417113916.grobid-xml"},"referenced_works_count":12,"referenced_works":["https://openalex.org/W1031015364","https://openalex.org/W2040297119","https://openalex.org/W2513506629","https://openalex.org/W2806382623","https://openalex.org/W2976977811","https://openalex.org/W3027716283","https://openalex.org/W3195494505","https://openalex.org/W4281951253","https://openalex.org/W4376616386","https://openalex.org/W4401065398","https://openalex.org/W4401863317","https://openalex.org/W4412888568"],"related_works":[],"abstract_inverted_index":{"Classical":[0],"traffic":[1,13,166],"volume":[2],"prediction":[3,123],"approaches":[4],"rely":[5],"primarily":[6],"on":[7,88],"structured":[8,41,69],"statistical":[9],"data":[10,28,47],"such":[11],"as":[12],"census,":[14],"land":[15],"use,":[16],"and":[17,32,63,77,110,137,168],"property":[18],"values,":[19],"but":[20],"are":[21],"constrained":[22],"by":[23],"insufficient":[24],"incorporation":[25],"of":[26],"unstructured":[27,46],"reflecting":[29],"road":[30,64,90,134,159],"environments":[31],"social":[33],"contexts.":[34],"We":[35],"propose":[36],"a":[37],"novel":[38],"framework":[39],"integrating":[40],"baseline":[42],"features":[43,151],"with":[44,100,125],"multimodal":[45],"through":[48],"Large":[49],"Multimodal":[50],"Models":[51],"(LMMs)":[52],"to":[53,71,82,122],"extract":[54,72],"semantic":[55,150],"information":[56],"from":[57,75],"satellite":[58,126],"imagery,":[59,62],"street":[60,138],"view":[61,139],"names.":[65],"Our":[66],"approach":[67],"uses":[68],"prompts":[70],"qualitative":[73],"assessments":[74],"imagery":[76,127,140],"applies":[78],"pretrained":[79],"vision-language":[80],"encoders":[81],"generate":[83],"unified":[84],"feature":[85],"representations.":[86],"Evaluation":[87],"Tokyo":[89],"segments":[91],"demonstrates":[92],"significant":[93],"improvements":[94],"across":[95],"multiple":[96],"machine":[97],"learning":[98],"models,":[99],"the":[101,129,162],"best":[102],"performing":[103],"model":[104],"achieving":[105],"4.5%":[106],"improvement":[107],"in":[108,113],"R\u00b2":[109],"25.9%":[111],"reduction":[112],"MAPE.":[114],"Ablation":[115],"studies":[116],"reveal":[117],"that":[118,148],"each":[119],"modality":[120],"contributes":[121],"accuracy,":[124],"providing":[128],"strongest":[130],"standalone":[131],"contribution,":[132],"while":[133],"name":[135],"semantics":[136],"show":[141],"strong":[142],"synergistic":[143],"effects.":[144],"SHAP":[145],"analysis":[146],"confirms":[147],"LMM-extracted":[149],"rank":[152],"among":[153],"top":[154],"predictive":[155],"factors":[156],"alongside":[157],"traditional":[158],"attributes,":[160],"demonstrating":[161],"framework\u2019s":[163],"effectiveness":[164],"for":[165],"engineering":[167],"commercial":[169],"location":[170],"intelligence":[171],"applications.":[172]},"counts_by_year":[],"updated_date":"2026-03-14T06:41:57.775601","created_date":"2025-12-08T00:00:00"}
