{"id":"https://openalex.org/W4394745212","doi":"https://doi.org/10.1145/3597503.3639150","title":"LLMParser: An Exploratory Study on Using Large Language Models for Log Parsing","display_name":"LLMParser: An Exploratory Study on Using Large Language Models for Log Parsing","publication_year":2024,"publication_date":"2024-04-12","ids":{"openalex":"https://openalex.org/W4394745212","doi":"https://doi.org/10.1145/3597503.3639150"},"language":"en","primary_location":{"id":"doi:10.1145/3597503.3639150","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3597503.3639150","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the IEEE/ACM 46th International Conference on Software Engineering","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.18001","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095376985","display_name":"Zeyang Ma","orcid":"https://orcid.org/0000-0002-0390-1547"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Zeyang Ma","raw_affiliation_strings":["Concordia University, Montreal, Canada"],"raw_orcid":"https://orcid.org/0000-0002-0390-1547","affiliations":[{"raw_affiliation_string":"Concordia University, Montreal, Canada","institution_ids":["https://openalex.org/I60158472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026999307","display_name":"An Ran Chen","orcid":"https://orcid.org/0000-0003-3137-7540"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"An Ran Chen","raw_affiliation_strings":["University of Alberta, Edmonton, Alberta, Canada"],"raw_orcid":"https://orcid.org/0000-0003-3137-7540","affiliations":[{"raw_affiliation_string":"University of Alberta, Edmonton, Alberta, Canada","institution_ids":["https://openalex.org/I154425047"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020218671","display_name":"Dong Jae Kim","orcid":"https://orcid.org/0000-0002-3181-0001"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Dong Jae Kim","raw_affiliation_strings":["Concordia University, Montreal, Canada"],"raw_orcid":"https://orcid.org/0000-0002-3181-0001","affiliations":[{"raw_affiliation_string":"Concordia University, Montreal, Canada","institution_ids":["https://openalex.org/I60158472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069372430","display_name":"Tse-Hsun Chen","orcid":"https://orcid.org/0000-0003-4027-0905"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Tse-Hsun Chen","raw_affiliation_strings":["Concordia University, Montreal, Canada"],"raw_orcid":"https://orcid.org/0000-0003-4027-0905","affiliations":[{"raw_affiliation_string":"Concordia University, Montreal, Canada","institution_ids":["https://openalex.org/I60158472"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100664833","display_name":"Shaowei Wang","orcid":"https://orcid.org/0000-0003-3823-1771"},"institutions":[{"id":"https://openalex.org/I46247651","display_name":"University of Manitoba","ror":"https://ror.org/02gfys938","country_code":"CA","type":"education","lineage":["https://openalex.org/I46247651"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Shaowei Wang","raw_affiliation_strings":["University of Manitoba, Winnipeg, Canada"],"raw_orcid":"https://orcid.org/0000-0003-3823-1771","affiliations":[{"raw_affiliation_string":"University of Manitoba, Winnipeg, Canada","institution_ids":["https://openalex.org/I46247651"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5095376985"],"corresponding_institution_ids":["https://openalex.org/I60158472"],"apc_list":null,"apc_paid":null,"fwci":23.5738,"has_fulltext":true,"cited_by_count":72,"citation_normalized_percentile":{"value":0.99721859,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"13"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10430","display_name":"Software Engineering Techniques and Practices","score":0.9742000102996826,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.8804379105567932},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7702615261077881},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5186287760734558},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.44855695962905884},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.37560001015663147},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3458007276058197}],"concepts":[{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.8804379105567932},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7702615261077881},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5186287760734558},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.44855695962905884},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.37560001015663147},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3458007276058197}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3597503.3639150","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3597503.3639150","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the IEEE/ACM 46th International Conference on Software Engineering","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2404.18001","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.18001","pdf_url":"https://arxiv.org/pdf/2404.18001","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.18001","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.18001","pdf_url":"https://arxiv.org/pdf/2404.18001","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4394745212.pdf","grobid_xml":"https://content.openalex.org/works/W4394745212.grobid-xml"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W1661413208","https://openalex.org/W2022686119","https://openalex.org/W2102632804","https://openalex.org/W2153470728","https://openalex.org/W2403646140","https://openalex.org/W2560021099","https://openalex.org/W2592771984","https://openalex.org/W2735591903","https://openalex.org/W2754665629","https://openalex.org/W2755402962","https://openalex.org/W2762028850","https://openalex.org/W2786424616","https://openalex.org/W2811120218","https://openalex.org/W2888115557","https://openalex.org/W2895810692","https://openalex.org/W2947815220","https://openalex.org/W2963999143","https://openalex.org/W2994865335","https://openalex.org/W2999614244","https://openalex.org/W3037424089","https://openalex.org/W3134079112","https://openalex.org/W3173777717","https://openalex.org/W3194274259","https://openalex.org/W3203565869","https://openalex.org/W3208954537","https://openalex.org/W3211022409","https://openalex.org/W3217001695","https://openalex.org/W4206410067","https://openalex.org/W4221079409","https://openalex.org/W4242838928","https://openalex.org/W4280534475","https://openalex.org/W4284692184","https://openalex.org/W4307079201","https://openalex.org/W4309623083","https://openalex.org/W4376142471","https://openalex.org/W4394946189"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W6643695","https://openalex.org/W4381248170","https://openalex.org/W4364306694"],"abstract_inverted_index":{"Logs":[0],"are":[1],"important":[2],"in":[3,16,34,93,192,197,204],"modern":[4],"software":[5],"development":[6],"with":[7,162],"runtime":[8],"information.":[9],"Log":[10],"parsing":[11,36,69,108,116,138,183,219],"is":[12],"the":[13,40,48,59,126,222],"first":[14],"step":[15],"many":[17],"log-based":[18],"analyses,":[19],"that":[20,102,142,170],"involve":[21],"extracting":[22],"structured":[23],"information":[24],"from":[25,176],"unstructured":[26],"log":[27,30,43,68,75,137,218,230],"data.":[28],"Traditional":[29],"parsers":[31,112],"face":[32],"challenges":[33],"accurately":[35],"logs":[37,175],"due":[38],"to":[39],"diversity":[41],"of":[42,50,61,97,128,228],"formats,":[44],"which":[45],"directly":[46],"impacts":[47],"performance":[49],"downstream":[51],"log-analysis":[52],"tasks.":[53],"In":[54,207],"this":[55],"paper,":[56],"we":[57],"explore":[58],"potential":[60],"using":[62,171,174,186,215],"Large":[63],"Language":[64],"Models":[65],"(LLMs)":[66],"for":[67,153,214,217],"and":[70,81,91,133,220,224],"propose":[71],"LLMParser,":[72],"an":[73,190],"LLM-based":[74,229],"parser":[76],"based":[77],"on":[78,125,136],"generative":[79],"LLMs":[80,144,172,216],"few-shot":[82],"tuning.":[83],"We":[84,118,140,167],"leverage":[85],"four":[86],"LLMs,":[87],"Flan-T5-small,":[88],"Flan-T5-base,":[89],"LLaMA-7B,":[90],"ChatGLM-6B":[92],"LLMParsers.":[94],"Our":[95],"evaluation":[96],"16":[98],"open-source":[99],"systems":[100,178],"shows":[101,189],"LLMParser":[103],"achieves":[104,157],"statistically":[105],"significantly":[106],"higher":[107],"accuracy":[109],"than":[110,149],"state-of-the-art":[111],"(a":[113],"96%":[114],"average":[115],"accuracy).":[117,206],"further":[119],"conduct":[120],"a":[121,163,198],"comprehensive":[122],"empirical":[123,212],"analysis":[124],"effect":[127],"training":[129],"size,":[130,132],"model":[131],"pre-training":[134],"LLM":[135],"accuracy.":[139,184],"find":[141,169],"smaller":[143],"may":[145],"be":[146],"more":[147,150],"effective":[148],"complex":[151],"LLMs;":[152],"instance":[154],"where":[155],"Flan-T5-base":[156,188],"comparable":[158],"results":[159,196],"as":[160],"LLaMA-7B":[161],"shorter":[164],"inference":[165],"time.":[166],"also":[168],"pre-trained":[173,187,194],"other":[177],"does":[179],"not":[180],"always":[181],"improve":[182],"While":[185],"improvement":[191],"accuracy,":[193],"LLaMA":[195],"decrease":[199],"(decrease":[200],"by":[201],"almost":[202],"55%":[203],"group":[205],"short,":[208],"our":[209],"study":[210],"provides":[211],"evidence":[213],"highlights":[221],"limitations":[223],"future":[225],"research":[226],"direction":[227],"parsers.":[231]},"counts_by_year":[{"year":2026,"cited_by_count":12},{"year":2025,"cited_by_count":48},{"year":2024,"cited_by_count":12}],"updated_date":"2026-05-10T08:33:47.465468","created_date":"2024-04-13T00:00:00"}
