{"id":"https://openalex.org/W4412888883","doi":"https://doi.org/10.18653/v1/2025.findings-acl.42","title":"First-Step Advantage: Importance of Starting Right in Multi-Step Math Reasoning","display_name":"First-Step Advantage: Importance of Starting Right in Multi-Step Math Reasoning","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412888883","doi":"https://doi.org/10.18653/v1/2025.findings-acl.42"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.findings-acl.42","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.42","pdf_url":"https://aclanthology.org/2025.findings-acl.42.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.findings-acl.42.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079270064","display_name":"Kushal Jain","orcid":"https://orcid.org/0000-0001-7259-976X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kushal Jain","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119181509","display_name":"Moritz Miller","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moritz Miller","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052882677","display_name":"Niket Tandon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Niket Tandon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5031480753","display_name":"Kumar Shridhar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kumar Shridhar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.18149827,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"766","last_page":"778"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10636","display_name":"Innovative Teaching and Learning Methods","score":0.8165000081062317,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10636","display_name":"Innovative Teaching and Learning Methods","score":0.8165000081062317,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.8001999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10130","display_name":"Mathematics Education and Teaching Techniques","score":0.795199990272522,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5454257130622864}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5454257130622864}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.findings-acl.42","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.42","pdf_url":"https://aclanthology.org/2025.findings-acl.42.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.findings-acl.42","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.findings-acl.42","pdf_url":"https://aclanthology.org/2025.findings-acl.42.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics: ACL 2025","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.4099999964237213,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412888883.pdf","grobid_xml":"https://content.openalex.org/works/W4412888883.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Language":[0],"models":[1,17,88,139],"can":[2,45,131],"solve":[3,21,46],"complex":[4],"reasoning":[5,118],"tasks":[6],"better":[7],"by":[8,59,82],"learning":[9],"to":[10,20,30,64,70,75,85,106,133,143,166],"generate":[11],"rationales":[12],"for":[13,120],"their":[14,25],"predictions.Often":[15],"these":[16],"know":[18],"how":[19,105],"a":[22,47,61,99,111],"task,":[23],"but":[24],"auto-regressive":[26],"decoding":[27],"nature":[28],"leads":[29,69],"incorrect":[31],"results":[32],"if":[33],"they":[34,50],"start":[35,130],"incorrectly.We":[36],"observe":[37],"that":[38,49,126],"smaller":[39,66,87,100,122],"models,":[40,67,123],"in":[41,89,162,171],"particular,":[42],"when":[43],"corrected,":[44],"task":[48],"would":[51],"have":[52],"otherwise":[53],"struggled":[54],"with.We":[55],"demonstrate":[56],"this":[57],"phenomenon":[58],"using":[60],"larger":[62],"model":[63,101],"guide":[65],"which":[68],"significantly":[71],"improved":[72],"performance":[73,135],"(up":[74],"+24":[76],"points":[77,145],"on":[78,146,149,152,156],"the":[79,91,128],"GSM8K":[80],"dataset":[81],"7B":[83],"models).Furthermore,":[84],"assist":[86],"initiating":[90],"starting":[92],"step":[93],"correctly,":[94],"we":[95,124],"propose":[96],"QuestCoT,":[97],"where":[98],"first":[102],"asks":[103],"itself":[104],"start,":[107],"before":[108],"proceeding":[109],"with":[110],"chain":[112],"of":[113,141,168],"reasoning.On":[114],"various":[115],"multistep":[116],"mathematical":[117],"datasets":[119],"multiple":[121],"show":[125],"getting":[127],"right":[129],"lead":[132],"significant":[134],"gains":[136],"across":[137],"all":[138],"(gains":[140],"up":[142],"+6":[144],"GSM8K,":[147],"+9":[148],"SVAMP,":[150],"+5":[151],"ASDiv,":[153],"and":[154],"+7":[155],"MultiArith).":[157],"LMNatalia":[158],"sold":[159,164],"48+72=120":[160],"clips":[161,165],"total.Natalia":[163],"48":[167],"her":[169],"friends":[170],"April....":[172]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
