{"id":"https://openalex.org/W4416035170","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.1772","title":"FoREST: Frame of Reference Evaluation in Spatial Reasoning Tasks","display_name":"FoREST: Frame of Reference Evaluation in Spatial Reasoning Tasks","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4416035170","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.1772"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2025.emnlp-main.1772","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.1772","pdf_url":"https://aclanthology.org/2025.emnlp-main.1772.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.emnlp-main.1772.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000549690","display_name":"Tanawan Premsri","orcid":null},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tanawan Premsri","raw_affiliation_strings":["Department of Computer Science and Engineering Michigan State University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering Michigan State University","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087682739","display_name":"Parisa Kordjamshidi","orcid":"https://orcid.org/0000-0002-4606-1824"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Parisa Kordjamshidi","raw_affiliation_strings":["Department of Computer Science and Engineering Michigan State University"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering Michigan State University","institution_ids":["https://openalex.org/I87216513"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5000549690"],"corresponding_institution_ids":["https://openalex.org/I87216513"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.38782351,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"34965","last_page":"34991"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11904","display_name":"Spatial Cognition and Navigation","score":0.6018999814987183,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11904","display_name":"Spatial Cognition and Navigation","score":0.6018999814987183,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.29170000553131104,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.010700000450015068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5331000089645386},{"id":"https://openalex.org/keywords/reference-frame","display_name":"Reference frame","score":0.3176000118255615},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.3125999867916107},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.30709999799728394},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.2867000102996826},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.2799000144004822}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6432999968528748},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5817999839782715},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5331000089645386},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4187000095844269},{"id":"https://openalex.org/C172849965","wikidata":"https://www.wikidata.org/wiki/Q3148875","display_name":"Reference frame","level":3,"score":0.3176000118255615},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3125999867916107},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.2867000102996826},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C74992021","wikidata":"https://www.wikidata.org/wiki/Q184876","display_name":"Frame of reference","level":2,"score":0.26330000162124634},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.26100000739097595},{"id":"https://openalex.org/C155911833","wikidata":"https://www.wikidata.org/wiki/Q3817354","display_name":"Spatial intelligence","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.emnlp-main.1772","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.1772","pdf_url":"https://aclanthology.org/2025.emnlp-main.1772.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.emnlp-main.1772","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.1772","pdf_url":"https://aclanthology.org/2025.emnlp-main.1772.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416035170.pdf","grobid_xml":"https://content.openalex.org/works/W4416035170.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Spatial":[0,69],"reasoning":[1,152],"is":[2,14,41,167,179,189,203,220],"a":[3,42,100,172,225],"fundamental":[4],"aspect":[5],"of":[6,17,24,44,50,65,157,171,224],"human":[7],"intelligence.One":[8],"key":[9],"concept":[10],"in":[11,34,55,68,79,93,108,124,207],"spatial":[12,25,39,141,151],"cognition":[13],"the":[15,22,63,169,175,182,190,193,199,204,210,222],"Frame":[16,64],"Reference":[18,66],"(FoR),":[19],"which":[20,134],"identifies":[21],"perspective":[23,214,216],"expressions.Despite":[26],"its":[27],"significance,":[28],"FoR":[29,77,88,106,125,128],"has":[30],"received":[31],"limited":[32],"attention":[33],"AI":[35],"models":[36,53,95],"that":[37,86],"need":[38],"intelligence.There":[40],"lack":[43],"dedicated":[45],"benchmarks":[46],"and":[47,90,143],"in-depth":[48],"evaluation":[49],"large":[51],"language":[52],"(LLMs)":[54],"this":[56,59],"area.To":[57],"address":[58],"issue,":[60],"we":[61,130],"introduce":[62],"Evaluation":[67],"Reasoning":[70],"Tasks":[71],"(FoREST)":[72],"benchmark,":[73],"designed":[74],"to":[75,114,138,168,209,221],"assess":[76],"comprehension":[78,89],"LLMs.We":[80],"evaluate":[81],"LLMs":[82],"on":[83,185],"answering":[84],"questions":[85],"require":[87],"layout":[91],"generation":[92],"textto-image":[94],"using":[96],"FoREST.Our":[97],"results":[98],"reveal":[99],"notable":[101],"performance":[102,149],"gap":[103],"across":[104,150],"different":[105],"classes":[107],"various":[109],"LLMs,":[110],"affecting":[111],"their":[112],"ability":[113,137],"generate":[115],"accurate":[116],"layouts":[117],"for":[118],"text-toimage":[119],"generation.This":[120],"highlights":[121],"critical":[122],"shortcomings":[123],"comprehension.To":[126],"improve":[127],"understanding,":[129],"propose":[131],"Spatial-Guided":[132],"prompting,":[133],"improves":[135,147],"LLMs'":[136],"extract":[139],"primitive":[140],"concepts":[142],"relations.Our":[144],"proposed":[145],"method":[146],"overall":[148],"tasks.":[153],"Context":[154],"Generation":[155],"List":[156],"ObjectsLocatum":[158],"(L)":[159],"Relatum":[160],"(R)":[161],"<L>":[162],"<relation>":[163],"<R>":[164],"A":[165,218],"cat":[166,191,205,219,227],"right":[170,223],"dog":[173,178,200],"from":[174,192],"dog's":[176,194],"perspective.A":[177],"facing":[180],"toward":[181],"camera.Q:":[183],"Based":[184],"camera":[186],"angle,":[187],"where":[188],"position?A:":[195],"Left":[196],"Q:":[197],"In":[198],"view,":[201],"how":[202],"positioned":[206],"relation":[208],"dog?A:":[211],"Right":[212],"Camera's":[213],"Relatum's":[215],"Visualization":[217],"dog.dog":[226]},"counts_by_year":[],"updated_date":"2026-03-08T06:56:09.383167","created_date":"2025-11-08T00:00:00"}
