{"id":"https://openalex.org/W7140146629","doi":"https://doi.org/10.48550/arxiv.2603.19253","title":"A comprehensive study of LLM-based argument classification: from Llama through DeepSeek to GPT-5.2","display_name":"A comprehensive study of LLM-based argument classification: from Llama through DeepSeek to GPT-5.2","publication_year":2026,"publication_date":"2026-02-25","ids":{"openalex":"https://openalex.org/W7140146629","doi":"https://doi.org/10.48550/arxiv.2603.19253"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.19253","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.19253","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036847074","display_name":"Marcin Pietro\u0144","orcid":"https://orcid.org/0000-0001-9357-9231"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Pietro\u0144, Marcin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071407075","display_name":"Filip Gampel","orcid":"https://orcid.org/0000-0001-7698-2440"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gampel, Filip","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087595512","display_name":"Jakub Gomu\u0142ka","orcid":"https://orcid.org/0000-0002-9100-0334"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gomu\u0142ka, Jakub","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130355078","display_name":"Andrzej Tomski","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tomski, Andrzej","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5081668377","display_name":"Rafa\u0142 Olszowski","orcid":"https://orcid.org/0000-0002-4494-3890"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Olszowski, Rafa\u0142","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5036847074"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.5877000093460083,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.5877000093460083,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.0989999994635582,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.05339999869465828,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/argument","display_name":"Argument (complex analysis)","score":0.7946000099182129},{"id":"https://openalex.org/keywords/argumentative","display_name":"Argumentative","score":0.715399980545044},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5612000226974487},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.559499979019165},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.4772999882698059},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.45910000801086426},{"id":"https://openalex.org/keywords/certainty","display_name":"Certainty","score":0.382099986076355},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.3068999946117401}],"concepts":[{"id":"https://openalex.org/C98184364","wikidata":"https://www.wikidata.org/wiki/Q1780131","display_name":"Argument (complex analysis)","level":2,"score":0.7946000099182129},{"id":"https://openalex.org/C2781306805","wikidata":"https://www.wikidata.org/wiki/Q4789761","display_name":"Argumentative","level":2,"score":0.715399980545044},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6075000166893005},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5612000226974487},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.559499979019165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5227000117301941},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48170000314712524},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.4772999882698059},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.45910000801086426},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.40799999237060547},{"id":"https://openalex.org/C7493553","wikidata":"https://www.wikidata.org/wiki/Q1520777","display_name":"Certainty","level":2,"score":0.382099986076355},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.3068999946117401},{"id":"https://openalex.org/C95986675","wikidata":"https://www.wikidata.org/wiki/Q185168","display_name":"Quantitative analysis (chemistry)","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C3018587665","wikidata":"https://www.wikidata.org/wiki/Q7268696","display_name":"Qualitative analysis","level":3,"score":0.29649999737739563},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2953000068664551},{"id":"https://openalex.org/C190248442","wikidata":"https://www.wikidata.org/wiki/Q839486","display_name":"Qualitative research","level":2,"score":0.29019999504089355},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2858000099658966},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.2842999994754791},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C197947376","wikidata":"https://www.wikidata.org/wiki/Q5155608","display_name":"Comparability","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C72196577","wikidata":"https://www.wikidata.org/wiki/Q1645946","display_name":"Argument map","level":3,"score":0.25920000672340393},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.25769999623298645},{"id":"https://openalex.org/C3018824978","wikidata":"https://www.wikidata.org/wiki/Q2894891","display_name":"Error analysis","level":2,"score":0.2565000057220459},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2551000118255615},{"id":"https://openalex.org/C2780922921","wikidata":"https://www.wikidata.org/wiki/Q255189","display_name":"Paraphrase","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.19253","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.19253","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Argument":[0],"mining":[1,211],"(AM)":[2],"is":[3],"an":[4],"interdisciplinary":[5],"research":[6],"field":[7],"focused":[8],"on":[9,65,208],"the":[10,24,38,111,143,149,196],"automatic":[11],"identification":[12],"and":[13,21,23,63,75,90,97,121,131,138,145,187,204],"classification":[14,42,70,116,136],"of":[15,40,55,118,126,148],"argumentative":[16],"components,":[17],"such":[18,72],"as":[19,73],"claims":[20],"premises,":[22],"relationships":[25],"between":[26],"them.":[27],"Recent":[28],"advances":[29],"in":[30,110,179],"large":[31,66],"language":[32],"models":[33,150],"(LLMs)":[34],"have":[35],"significantly":[36],"improved":[37],"performance":[39,95,137],"argument":[41,69,185,210],"compared":[43],"to":[44,103,159,175],"traditional":[45],"machine":[46],"learning":[47],"approaches.":[48],"This":[49,193],"study":[50,112],"presents":[51],"a":[52,115,153],"comprehensive":[53,198],"evaluation":[54,78,199],"several":[56],"state-of-the-art":[57],"LLMs,":[58],"including":[59,83,171],"GPT-5.2,":[60],"Llama":[61],"4,":[62],"DeepSeek,":[64],"publicly":[67],"available":[68],"corpora":[71],"Args.me":[74],"UKP.":[76],"The":[77,107,124],"incorporates":[79],"advanced":[80,214],"prompting":[81,216],"strategies,":[82],"Chain-of-":[84],"Thought":[85],"prompting,":[86],"prompt":[87,127,176],"rephrasing,":[88,128],"voting,":[89,130],"certainty-based":[91],"classification.":[92],"Both":[93],"quantitative":[94,202],"metrics":[96],"qualitative":[98,162,205],"error":[99,206],"analysis":[100,163,207],"are":[101],"conducted":[102],"assess":[104],"model":[105,109],"behavior.":[106],"best-performing":[108],"(GPT-5.2)":[113],"achieves":[114],"accuracy":[117,144],"78.0%":[119],"(UKP)":[120],"91.9%":[122],"(Args.me).":[123],"use":[125],"multi-prompt":[129],"certainty":[132],"estimation":[133],"further":[134],"improves":[135],"robustness.":[139],"These":[140],"techniques":[141],"increase":[142],"F1":[146],"metric":[147],"by":[151],"typically":[152],"few":[154],"percentage":[155],"points":[156],"(from":[157],"2%":[158],"8%).":[160],"However,":[161],"reveals":[164],"systematic":[165],"failure":[166],"modes":[167],"shared":[168],"across":[169],"models,":[170],"instabilities":[172],"with":[173,190],"respect":[174],"formulation,":[177],"difficulties":[178],"detecting":[180],"implicit":[181],"criticism,":[182],"interpreting":[183],"complex":[184],"structures,":[186],"aligning":[188],"arguments":[189],"specific":[191],"claims.":[192],"work":[194],"contributes":[195],"first":[197],"that":[200],"combines":[201],"benchmarking":[203],"multiple":[209],"datasets":[212],"using":[213],"LLM":[215],"strategies.":[217]},"counts_by_year":[],"updated_date":"2026-03-24T06:04:31.470712","created_date":"2026-03-24T00:00:00"}
