{"id":"https://openalex.org/W7141265299","doi":"https://doi.org/10.48550/arxiv.2603.25005","title":"Error Understanding in Program Code With LLM-DL for Multi-label Classification","display_name":"Error Understanding in Program Code With LLM-DL for Multi-label Classification","publication_year":2026,"publication_date":"2026-03-26","ids":{"openalex":"https://openalex.org/W7141265299","doi":"https://doi.org/10.48550/arxiv.2603.25005"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.25005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.25005","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061975231","display_name":"Md Faizul Ibne Amin","orcid":"https://orcid.org/0009-0001-0722-3536"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Amin, Md Faizul Ibne","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026370198","display_name":"Yutaka Watanobe","orcid":"https://orcid.org/0000-0002-0030-3859"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Watanobe, Yutaka","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023926503","display_name":"Md. Mostafizer Rahman","orcid":"https://orcid.org/0000-0001-9368-7638"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rahman, Md. Mostafizer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045190357","display_name":"Daniel M. Muepu","orcid":"https://orcid.org/0009-0000-0867-3697"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muepu, Daniel M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5055764774","display_name":"Md. Shahajada Mia","orcid":"https://orcid.org/0009-0001-6499-410X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mia, Md. Shahajada","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5061975231"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.8816999793052673,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.8816999793052673,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.01510000042617321,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.012000000104308128,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.6832000017166138},{"id":"https://openalex.org/keywords/hamming-code","display_name":"Hamming code","score":0.5424000024795532},{"id":"https://openalex.org/keywords/jaccard-index","display_name":"Jaccard index","score":0.4643999934196472},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.44359999895095825},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4138000011444092},{"id":"https://openalex.org/keywords/hamming-distance","display_name":"Hamming distance","score":0.41119998693466187},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.39149999618530273},{"id":"https://openalex.org/keywords/error-detection-and-correction","display_name":"Error detection and correction","score":0.38679999113082886}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7843000292778015},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.6832000017166138},{"id":"https://openalex.org/C73150493","wikidata":"https://www.wikidata.org/wiki/Q853922","display_name":"Hamming code","level":4,"score":0.5424000024795532},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.539900004863739},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4749000072479248},{"id":"https://openalex.org/C203519979","wikidata":"https://www.wikidata.org/wiki/Q865360","display_name":"Jaccard index","level":3,"score":0.4643999934196472},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.44359999895095825},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4138000011444092},{"id":"https://openalex.org/C193319292","wikidata":"https://www.wikidata.org/wiki/Q272172","display_name":"Hamming distance","level":2,"score":0.41119998693466187},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.40610000491142273},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.39149999618530273},{"id":"https://openalex.org/C103088060","wikidata":"https://www.wikidata.org/wiki/Q1062839","display_name":"Error detection and correction","level":2,"score":0.38679999113082886},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.38350000977516174},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3747999966144562},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3490999937057495},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.34610000252723694},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.3167000114917755},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2849000096321106},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C34165917","wikidata":"https://www.wikidata.org/wiki/Q188267","display_name":"Programming paradigm","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.2538999915122986},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.25200000405311584}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.25005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.25005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.25005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6848006248474121}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Programming":[0],"is":[1],"a":[2,65,117,176],"core":[3],"skill":[4],"in":[5,35,44,230],"computer":[6],"science":[7],"and":[8,14,23,39,85,101,113,146,159,163,194,234],"software":[9],"engineering":[10],"(SE),":[11],"yet":[12],"identifying":[13],"resolving":[15],"code":[16,73,121,225],"errors":[17],"remains":[18,56],"challenging":[19],"for":[20,71,218,223],"both":[21,111],"novice":[22],"experienced":[24],"developers.":[25],"While":[26],"Large":[27],"Language":[28],"Models":[29],"(LLMs)":[30],"have":[31,135],"shown":[32],"remarkable":[33],"capabilities":[34],"natural":[36],"language":[37],"understanding":[38],"generation":[40],"tasks,":[41],"their":[42],"potential":[43,228],"domain-specific,":[45],"complex":[46],"scenarios,":[47],"such":[48,96],"as":[49,97],"multi-label":[50,66,140],"classification":[51,68],"(MLC)":[52],"of":[53,179,183,188,192,197,204],"programming":[54,231],"errors,":[55],"underexplored.":[57],"Recognizing":[58],"this":[59,62],"less-explored":[60],"area,":[61],"study":[63],"proposes":[64],"error":[67,122,196],"(MLEC)":[69],"framework":[70],"source":[72],"that":[74,167],"leverages":[75],"fine-tuned":[76],"LLMs,":[77],"including":[78,142],"CodeT5-base,":[79],"GraphCodeBERT,":[80],"CodeT5+,":[81],"UniXcoder,":[82],"RoBERTa,":[83],"PLBART,":[84],"CoTexT.":[86],"These":[87,199],"LLMs":[88],"are":[89],"integrated":[90],"with":[91,103,175,209,227],"deep":[92],"learning":[93],"(DL)":[94],"architectures":[95],"GRU,":[98],"LSTM,":[99],"BiLSTM,":[100],"BiLSTM":[102],"an":[104],"additive":[105],"attention":[106],"mechanism":[107],"(BiLSTM-A)":[108],"to":[109],"capture":[110],"syntactic":[112],"semantic":[114,207],"features":[115],"from":[116],"real-world":[118],"student-written":[119],"Python":[120],"dataset.":[123],"Extensive":[124],"experiments":[125],"across":[126],"32":[127],"model":[128,170],"variants,":[129],"optimized":[130],"using":[131,138],"Optuna-based":[132],"hyperparameter":[133],"tuning,":[134],"been":[136],"evaluated":[137],"comprehensive":[139],"metrics,":[141],"average":[143,181],"accuracy,":[144,153],"macro":[145],"weighted":[147,177],"precision,":[148],"recall,":[149],"F1-score,":[150],"exact":[151,185],"match":[152,186],"One-error,":[154],"Hamming":[155,190],"loss,":[156],"Jaccard":[157],"similarity,":[158],"ROC-AUC":[160],"(micro,":[161],"macro,":[162],"weighted).":[164],"Results":[165],"show":[166],"the":[168,172,202,216],"CodeT5+\\_GRU":[169],"achieved":[171],"strongest":[173],"performance,":[174],"F1-score":[178],"0.8243,":[180],"accuracy":[182,187],"91.84\\%,":[184],"53.78\\%,":[189],"loss":[191],"0.0816,":[193],"One":[195],"0.0708.":[198],"findings":[200],"confirm":[201],"effectiveness":[203],"combining":[205],"pretrained":[206],"encoders":[208],"efficient":[210],"recurrent":[211],"decoders.":[212],"This":[213],"work":[214],"lays":[215],"foundation":[217],"developing":[219],"intelligent,":[220],"scalable":[221],"tools":[222],"automated":[224],"feedback,":[226],"applications":[229],"education":[232],"(PE)":[233],"broader":[235],"SE":[236],"domains.":[237]},"counts_by_year":[],"updated_date":"2026-04-30T09:15:22.047038","created_date":"2026-03-28T00:00:00"}
