{"id":"https://openalex.org/W7151295280","doi":"https://doi.org/10.48550/arxiv.2604.04106","title":"InsTraj: Instructing Diffusion Models with Travel Intentions to Generate Real-world Trajectories","display_name":"InsTraj: Instructing Diffusion Models with Travel Intentions to Generate Real-world Trajectories","publication_year":2026,"publication_date":"2026-04-05","ids":{"openalex":"https://openalex.org/W7151295280","doi":"https://doi.org/10.48550/arxiv.2604.04106"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.04106","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04106","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.04106","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084537731","display_name":"Yuanshao Zhu","orcid":"https://orcid.org/0000-0002-5657-181X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhu, Yuanshao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133103404","display_name":"Yuxuan Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Yuxuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133128519","display_name":"Xiangyu Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Xiangyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133112656","display_name":"Liang Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Liang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133118663","display_name":"Xinwei Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Xinwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133130762","display_name":"Xuetao Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Xun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133087513","display_name":"James Jianqiao Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Xuetao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Yu, James Jianqiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, James Jianqiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5084537731"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.46959999203681946,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.46959999203681946,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.11900000274181366,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.0803999975323677,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.5866000056266785},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.5824000239372253},{"id":"https://openalex.org/keywords/natural-language-understanding","display_name":"Natural language understanding","score":0.4514999985694885},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4189000129699707},{"id":"https://openalex.org/keywords/global-positioning-system","display_name":"Global Positioning System","score":0.41749998927116394},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.3763999938964844},{"id":"https://openalex.org/keywords/decipher","display_name":"DECIPHER","score":0.3756999969482422},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3727000057697296}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7932000160217285},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.5866000056266785},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.5824000239372253},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5457000136375427},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.4514999985694885},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4189000129699707},{"id":"https://openalex.org/C60229501","wikidata":"https://www.wikidata.org/wiki/Q18822","display_name":"Global Positioning System","level":2,"score":0.41749998927116394},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3763999938964844},{"id":"https://openalex.org/C164614171","wikidata":"https://www.wikidata.org/wiki/Q5204775","display_name":"DECIPHER","level":2,"score":0.3756999969482422},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3727000057697296},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.3614000082015991},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.361299991607666},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.3546000123023987},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3504999876022339},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2955000102519989},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2915000021457672},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.2913999855518341},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.2825999855995178},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.28189998865127563},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27230000495910645},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.2712000012397766},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2662000060081482},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2624000012874603},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.25999999046325684},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.04106","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04106","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.04106","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04106","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities","score":0.8039817214012146}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"generation":[1],"of":[2],"realistic":[3,51],"and":[4,19,42,102,109,127,155],"controllable":[5],"GPS":[6],"trajectories":[7,73,129,150],"is":[8],"a":[9,27,63,83,114],"fundamental":[10],"task":[11],"for":[12],"applications":[13],"in":[14,54,94,148],"urban":[15],"planning,":[16],"mobility":[17],"simulation,":[18],"privacy-preserving":[20],"data":[21],"sharing.":[22],"However,":[23],"existing":[24],"methods":[25,147],"face":[26],"two-fold":[28],"challenge:":[29],"they":[30],"lack":[31],"the":[32,50,104,159],"deep":[33],"semantic":[34,100,122],"understanding":[35],"to":[36,44,70,88,124,132,158],"interpret":[37],"complex":[38,46],"user":[39,134],"travel":[40,91],"intent,":[41],"struggle":[43],"handle":[45],"constraints":[47],"while":[48],"maintaining":[49],"diversity":[52],"inherent":[53],"human":[55],"behavior.":[56],"To":[57],"resolve":[58],"this,":[59],"we":[60,112],"introduce":[61],"InsTraj,":[62],"novel":[64],"framework":[65],"that":[66,119,130,142,151],"instructs":[67],"diffusion":[68,117],"models":[69],"generate":[71,125],"high-fidelity":[72,126],"directly":[74],"from":[75],"natural":[76,95],"language":[77,86],"descriptions.":[78],"Specifically,":[79],"InsTraj":[80,143],"first":[81],"utilizes":[82],"powerful":[84],"large":[85],"model":[87],"decipher":[89],"unstructured":[90],"intentions":[92,108],"formed":[93],"language,":[96],"thereby":[97],"creating":[98],"rich":[99],"blueprints":[101],"bridging":[103],"representation":[105],"gap":[106],"between":[107],"trajectories.":[110],"Subsequently,":[111],"proposed":[113],"multimodal":[115],"trajectory":[116],"transformer":[118],"can":[120],"integrate":[121],"guidance":[123],"instruction-faithful":[128],"adhere":[131],"fine-grained":[133],"intent.":[135],"Comprehensive":[136],"experiments":[137],"on":[138],"real-world":[139],"datasets":[140],"demonstrate":[141],"significantly":[144],"outperforms":[145],"state-of-the-art":[146],"generating":[149],"are":[152],"realistic,":[153],"diverse,":[154],"semantically":[156],"faithful":[157],"input":[160],"instructions.":[161]},"counts_by_year":[],"updated_date":"2026-05-06T06:03:25.996018","created_date":"2026-04-08T00:00:00"}
