{"id":"https://openalex.org/W4416749048","doi":"https://doi.org/10.1109/iros60139.2025.11246452","title":"LATMOS: Latent Automaton Task Model from Observation Sequences","display_name":"LATMOS: Latent Automaton Task Model from Observation Sequences","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4416749048","doi":"https://doi.org/10.1109/iros60139.2025.11246452"},"language":null,"primary_location":{"id":"doi:10.1109/iros60139.2025.11246452","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11246452","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053685990","display_name":"Weixiao Zhan","orcid":"https://orcid.org/0000-0003-2091-9797"},"institutions":[{"id":"https://openalex.org/I160856358","display_name":"University of San Diego","ror":"https://ror.org/03jbbze48","country_code":"US","type":"education","lineage":["https://openalex.org/I160856358"]},{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Weixiao Zhan","raw_affiliation_strings":["University of California San Diego,Department of Computer Science and Engineering,CA,USA,92093"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California San Diego,Department of Computer Science and Engineering,CA,USA,92093","institution_ids":["https://openalex.org/I36258959","https://openalex.org/I160856358"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qiyue Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qiyue Dong","raw_affiliation_strings":["University of California San Diego,Department of Electrical and Computer Engineering,CA,USA,92093"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California San Diego,Department of Electrical and Computer Engineering,CA,USA,92093","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102919228","display_name":"Eduardo Sebasti\u00e1n","orcid":"https://orcid.org/0000-0001-9671-4056"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Eduardo Sebasti\u00e1n","raw_affiliation_strings":["University of Cambridge,Department of Computer Science and Technology,Cambridge,UK,CB3 0FD"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Cambridge,Department of Computer Science and Technology,Cambridge,UK,CB3 0FD","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066400889","display_name":"Nikolay Atanasov","orcid":"https://orcid.org/0000-0003-0272-7580"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nikolay Atanasov","raw_affiliation_strings":["University of California San Diego,Department of Electrical and Computer Engineering,CA,USA,92093"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California San Diego,Department of Electrical and Computer Engineering,CA,USA,92093","institution_ids":["https://openalex.org/I36258959"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.40154681,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"21032","last_page":"21039"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.33959999680519104,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.33959999680519104,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.23800000548362732,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.06989999860525131,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6807000041007996},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6186000108718872},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.565500020980835},{"id":"https://openalex.org/keywords/automaton","display_name":"Automaton","score":0.5239999890327454},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.46950000524520874},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4629000127315521},{"id":"https://openalex.org/keywords/finite-state-machine","display_name":"Finite-state machine","score":0.3813999891281128},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.37689998745918274}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7803999781608582},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6807000041007996},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6186000108718872},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6074000000953674},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.565500020980835},{"id":"https://openalex.org/C112505250","wikidata":"https://www.wikidata.org/wiki/Q787116","display_name":"Automaton","level":2,"score":0.5239999890327454},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.46950000524520874},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4629000127315521},{"id":"https://openalex.org/C167822520","wikidata":"https://www.wikidata.org/wiki/Q176452","display_name":"Finite-state machine","level":2,"score":0.3813999891281128},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.37689998745918274},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.3659000098705292},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3357999920845032},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.33489999175071716},{"id":"https://openalex.org/C2776505523","wikidata":"https://www.wikidata.org/wiki/Q4785468","display_name":"Plan (archaeology)","level":2,"score":0.33079999685287476},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3305000066757202},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3215999901294708},{"id":"https://openalex.org/C2776228582","wikidata":"https://www.wikidata.org/wiki/Q7455797","display_name":"Service robot","level":3,"score":0.2962999939918518},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.28209999203681946},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.26409998536109924},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2563000023365021},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.25440001487731934},{"id":"https://openalex.org/C165753454","wikidata":"https://www.wikidata.org/wiki/Q1020380","display_name":"B\u00fcchi automaton","level":4,"score":0.2542000114917755},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.2508000135421753},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros60139.2025.11246452","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11246452","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W187068044","https://openalex.org/W1499727625","https://openalex.org/W1512310098","https://openalex.org/W1969483458","https://openalex.org/W1989445634","https://openalex.org/W2082863623","https://openalex.org/W2144588269","https://openalex.org/W2151958719","https://openalex.org/W2163941698","https://openalex.org/W2235884325","https://openalex.org/W2295721640","https://openalex.org/W2406438973","https://openalex.org/W2899953468","https://openalex.org/W2966183138","https://openalex.org/W3033621224","https://openalex.org/W3091670144","https://openalex.org/W3094503932","https://openalex.org/W3176904019","https://openalex.org/W3186824508","https://openalex.org/W3194226733","https://openalex.org/W4210600503","https://openalex.org/W4312372834","https://openalex.org/W4312614039","https://openalex.org/W4317207462","https://openalex.org/W4319159951","https://openalex.org/W4385245566","https://openalex.org/W4390873954","https://openalex.org/W4390874280","https://openalex.org/W4399951492","https://openalex.org/W4401413894","https://openalex.org/W4401414087","https://openalex.org/W4402402057","https://openalex.org/W4402727748","https://openalex.org/W4403923224","https://openalex.org/W4405787555","https://openalex.org/W4413925878","https://openalex.org/W4413945685","https://openalex.org/W4413945948"],"related_works":[],"abstract_inverted_index":{"Robot":[0],"task":[1,25,50,61,72,79,125,151],"planning":[2,26,57,91],"from":[3,52,77,101],"high-level":[4],"instructions":[5],"is":[6,81],"an":[7,70,95,111],"important":[8],"step":[9],"towards":[10],"deploying":[11],"fully":[12],"autonomous":[13],"robot":[14,24,150],"systems":[15],"in":[16,115,123],"the":[17,48,85,116],"service":[18],"sector.":[19],"Three":[20],"key":[21],"aspects":[22],"of":[23,37,47,60,167],"present":[27],"challenges":[28],"yet":[29],"to":[30,83,98],"be":[31],"resolved":[32],"simultaneously,":[33],"namely,":[34],"(i)":[35,129],"factorization":[36],"complex":[38],"tasks":[39,131,139],"specifications":[40],"into":[41],"simpler":[42],"executable":[43],"subtasks,":[44],"(ii)":[45,136],"understanding":[46],"current":[49],"state":[51,156],"raw":[53],"observations,":[54],"and":[55,58,90,143,147,155,164,173],"(iii)":[56,148],"verification":[59,89,165],"executions.":[62],"To":[63],"address":[64],"these":[65],"challenges,":[66],"we":[67],"propose":[68],"LATMOS,":[69],"automata-theory-inspired":[71],"model":[73,108,126],"that,":[74],"given":[75],"observations":[76,104],"correct":[78],"executions,":[80],"able":[82],"factorize":[84],"task,":[86],"while":[87],"supporting":[88],"operations.":[92],"LATMOS":[93,168],"combines":[94],"observation":[96,171],"encoder":[97],"extract":[99],"features":[100],"potentially":[102],"high-dimensional":[103],"with":[105,113],"a":[106,149],"sequence":[107],"that":[109],"encapsulates":[110],"automaton":[112],"symbols":[114],"latent":[117],"feature":[118],"space.":[119],"We":[120],"conduct":[121],"evaluations":[122],"three":[124],"learning":[127],"setups:":[128],"abstract":[130],"described":[132,140,152],"by":[133,141,153],"logical":[134],"formulas,":[135],"real-world":[137],"human":[138],"videos":[142],"natural":[144],"language":[145],"prompts":[146],"image":[154],"observations.":[157],"The":[158],"results":[159],"show":[160],"improved":[161],"plan":[162],"generation":[163],"capabilities":[166],"across":[169],"different":[170],"modalities":[172],"tasks.":[174]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-28T00:00:00"}
