{"id":"https://openalex.org/W4416036206","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.855","title":"Do Large Language Models excel in Complex Logical Reasoning with Formal Language?","display_name":"Do Large Language Models excel in Complex Logical Reasoning with Formal Language?","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4416036206","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.855"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2025.emnlp-main.855","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.855","pdf_url":"https://aclanthology.org/2025.emnlp-main.855.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.emnlp-main.855.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101879416","display_name":"Jin Jiang","orcid":"https://orcid.org/0000-0001-6033-609X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jin Jiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100338010","display_name":"Jianing Wang","orcid":"https://orcid.org/0000-0002-9294-2809"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jianing Wang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101121352","display_name":"Yuchen Yan","orcid":"https://orcid.org/0000-0002-7903-8102"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuchen Yan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100355692","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0001-7300-9215"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100514591","display_name":"Jianhua Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jianhua Zhu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100717443","display_name":"Mengdi Zhang","orcid":"https://orcid.org/0000-0002-3239-4804"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mengdi Zhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5004474713","display_name":"Liangcai Gao","orcid":"https://orcid.org/0000-0001-9444-1568"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liangcai Gao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101879416"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.4912,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.95089955,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"16889","last_page":"16914"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.1445000022649765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.1445000022649765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.07119999825954437,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.0608999989926815,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automated-reasoning","display_name":"Automated reasoning","score":0.5778999924659729},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.3587999939918518},{"id":"https://openalex.org/keywords/object-language","display_name":"Object language","score":0.3352999985218048},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.3305000066757202},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3276999890804291},{"id":"https://openalex.org/keywords/formal-language","display_name":"Formal language","score":0.29679998755455017},{"id":"https://openalex.org/keywords/model-based-reasoning","display_name":"Model-based reasoning","score":0.2962000072002411},{"id":"https://openalex.org/keywords/non-monotonic-logic","display_name":"Non-monotonic logic","score":0.2948000133037567}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6879000067710876},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.5778999924659729},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5023999810218811},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48410001397132874},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4318000078201294},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3587999939918518},{"id":"https://openalex.org/C185954173","wikidata":"https://www.wikidata.org/wiki/Q4347052","display_name":"Object language","level":3,"score":0.3352999985218048},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3305000066757202},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3276999890804291},{"id":"https://openalex.org/C146072743","wikidata":"https://www.wikidata.org/wiki/Q192161","display_name":"Formal language","level":2,"score":0.29679998755455017},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.2962000072002411},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.2948000133037567},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.2946999967098236},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.28200000524520874},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.2745000123977661},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.27079999446868896},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.2526000142097473},{"id":"https://openalex.org/C161301231","wikidata":"https://www.wikidata.org/wiki/Q3478658","display_name":"Knowledge representation and reasoning","level":2,"score":0.2515999972820282},{"id":"https://openalex.org/C134752490","wikidata":"https://www.wikidata.org/wiki/Q374182","display_name":"Logical consequence","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.emnlp-main.855","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.855","pdf_url":"https://aclanthology.org/2025.emnlp-main.855.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.emnlp-main.855","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.855","pdf_url":"https://aclanthology.org/2025.emnlp-main.855.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7607908787","display_name":null,"funder_award_id":"202404","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416036206.pdf","grobid_xml":"https://content.openalex.org/works/W4416036206.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"been":[5],"shown":[6],"to":[7,24,27,45,130,153],"achieve":[8,159],"breakthrough":[9],"performance":[10,119],"on":[11,20],"complex":[12],"logical":[13,54],"reasoning":[14,30,55,100],"tasks.Nevertheless,":[15],"most":[16],"existing":[17],"research":[18],"focuses":[19],"employing":[21],"formal":[22,58,89,108,156],"language":[23,90,135],"guide":[25],"LLMs":[26,51,95,152],"derive":[28],"reliable":[29],"paths,":[31],"while":[32],"systematic":[33],"evaluations":[34],"of":[35,50,62,67,70,74,103],"these":[36],"capabilities":[37],"are":[38],"still":[39],"limited.In":[40],"this":[41],"paper,":[42],"we":[43,123],"aim":[44],"conduct":[46],"a":[47,107,144],"comprehensive":[48],"evaluation":[49],"across":[52,120,155],"various":[53],"problems":[56],"utilizing":[57],"languages.From":[59],"the":[60,116,126,133,138,160],"perspective":[61],"three":[63],"dimensions,":[64],"i.e.,":[65],"spectrum":[66],"LLMs,":[68],"taxonomy":[69],"tasks,":[71],"and":[72,137,158],"format":[73,114],"trajectories,":[75],"our":[76],"key":[77],"findings":[78],"are:":[79],"1)":[80],"Thinking":[81],"models":[82],"significantly":[83],"outperform":[84],"Instruct":[85],"models,":[86,136],"especially":[87],"when":[88],"is":[91],"employed;":[92],"2)":[93],"All":[94],"exhibit":[96],"limitations":[97],"in":[98],"inductive":[99],"capability,":[101],"irrespective":[102],"whether":[104],"they":[105],"use":[106],"language;":[109],"3)":[110],"Data":[111],"with":[112],"PoT":[113],"achieves":[115],"best":[117,161],"generalization":[118],"other":[121],"languages.Additionally,":[122],"also":[124],"curate":[125],"formal-relative":[127],"training":[128],"data":[129],"further":[131],"enhance":[132],"small":[134],"experimental":[139],"results":[140],"1":[141],"indicate":[142],"that":[143],"simple":[145],"rejected":[146],"fine-tuning":[147],"method":[148],"can":[149],"better":[150],"enable":[151],"generalize":[154],"languages":[157],"overall":[162],"performance.":[163]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-18T07:56:08.524223","created_date":"2025-11-08T00:00:00"}
