{"id":"https://openalex.org/W7138058206","doi":"https://doi.org/10.1609/aaai.v40i5.37335","title":"TraveLLaMA: A Multimodal Travel Assistant with Large-Scale Dataset and Structured Reasoning","display_name":"TraveLLaMA: A Multimodal Travel Assistant with Large-Scale Dataset and Structured Reasoning","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138058206","doi":"https://doi.org/10.1609/aaai.v40i5.37335"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i5.37335","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i5.37335","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i5.37335","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129701597","display_name":"Meng Chu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Meng Chu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129737653","display_name":"Yukang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yukang Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119949440","display_name":"Haokun Gui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haokun Gui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121128384","display_name":"Shaozuo Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shaozuo Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129694574","display_name":"Yi Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi Wang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129704416","display_name":"Jiaya Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiaya Jia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5129701597"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.31831187,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"5","first_page":"3390","last_page":"3398"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7896999716758728,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7896999716758728,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11904","display_name":"Spatial Cognition and Navigation","score":0.07989999651908875,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.01549999974668026,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.7128999829292297},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5899999737739563},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.42239999771118164},{"id":"https://openalex.org/keywords/case-based-reasoning","display_name":"Case-based reasoning","score":0.3846000134944916},{"id":"https://openalex.org/keywords/contextual-design","display_name":"Contextual design","score":0.34610000252723694},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.34369999170303345},{"id":"https://openalex.org/keywords/multimodal-interaction","display_name":"Multimodal interaction","score":0.3287999927997589},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.3203999996185303}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7716000080108643},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.7128999829292297},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5899999737739563},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47110000252723694},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4690000116825104},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.42239999771118164},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.3846000134944916},{"id":"https://openalex.org/C71611378","wikidata":"https://www.wikidata.org/wiki/Q5165191","display_name":"Contextual design","level":3,"score":0.34610000252723694},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.34369999170303345},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3368000090122223},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.33390000462532043},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.3287999927997589},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3203999996185303},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.31940001249313354},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.31470000743865967},{"id":"https://openalex.org/C114073186","wikidata":"https://www.wikidata.org/wiki/Q2631895","display_name":"Automated planning and scheduling","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.30489999055862427},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2939000129699707},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2773999869823456},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i5.37335","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i5.37335","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i5.37335","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i5.37335","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","score":0.697597086429596,"display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Tourism":[0],"and":[1,18,75,78,97,110,152,163,185],"travel":[2,35,47,68,92,148,191],"planning":[3],"increasingly":[4],"rely":[5],"on":[6,124],"digital":[7],"assistance,":[8],"yet":[9],"existing":[10],"multimodal":[11,29,190],"AI":[12,46],"systems":[13],"often":[14],"lack":[15],"specialized":[16,28],"knowledge":[17],"contextual":[19,147],"understanding":[20,154],"of":[21,43,58,179],"urban":[22],"environments.":[23],"We":[24],"present":[25],"TraveLLaMA,":[26],"a":[27,55,86,174],"language":[30],"model":[31,142],"designed":[32],"for":[33,189],"comprehensive":[34],"assistance.":[36],"Our":[37,141],"work":[38],"addresses":[39],"the":[40],"fundamental":[41],"challenge":[42],"developing":[44],"practical":[45,98,157],"assistants":[48],"through":[49,117],"three":[50],"key":[51],"contributions:":[52],"(1)":[53],"TravelQA,":[54],"novel":[56],"dataset":[57],"265k":[59],"question-answer":[60],"pairs":[61],"combining":[62],"160k":[63],"text":[64],"QA":[65,72],"from":[66],"authentic":[67],"sources,":[69],"100k":[70],"vision-language":[71,126],"featuring":[73],"maps":[74],"location":[76],"imagery,":[77],"5k":[79],"expert-annotated":[80],"Chain-of-Thought":[81],"reasoning":[82,88],"examples;":[83],"(2)":[84],"Travel-CoT,":[85],"structured":[87],"framework":[89],"that":[90],"decomposes":[91],"queries":[93],"into":[94],"spatial,":[95],"temporal,":[96],"dimensions,":[99],"improving":[100],"answer":[101],"accuracy":[102],"by":[103,138],"10.8%":[104],"while":[105,155],"providing":[106,156],"interpretable":[107],"decision":[108],"paths;":[109],"(3)":[111],"an":[112],"interactive":[113],"agent":[114],"system":[115],"validated":[116],"extensive":[118],"user":[119],"studies.":[120],"Through":[121],"fine-tuning":[122],"experiments":[123],"state-of-the-art":[125],"models":[127,184],"(LLaVA,":[128],"Qwen-VL,":[129],"Shikra),":[130],"we":[131],"achieve":[132],"6.2-9.4%":[133],"base":[134],"improvements,":[135],"further":[136],"enhanced":[137],"Travel-CoT":[139],"reasoning.":[140],"demonstrates":[143],"superior":[144],"capabilities":[145],"in":[146],"recommendations,":[149],"map":[150],"interpretation,":[151],"scene":[153],"information":[158],"such":[159],"as":[160],"operating":[161],"hours":[162],"cultural":[164],"insights.":[165],"User":[166],"studies":[167],"with":[168],"500":[169],"participants":[170],"show":[171],"TraveLLaMA":[172],"achieves":[173],"System":[175],"Usability":[176],"Scale":[177],"score":[178],"82.5,":[180],"significantly":[181],"outperforming":[182],"general-purpose":[183],"establishing":[186],"new":[187],"standards":[188],"assistance":[192],"systems.":[193]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2026-03-18T00:00:00"}
