{"id":"https://openalex.org/W4415594438","doi":"https://doi.org/10.1109/tse.2025.3625121","title":"SemanticLog: Towards Effective and Efficient Large-Scale Semantic Log Parsing","display_name":"SemanticLog: Towards Effective and Efficient Large-Scale Semantic Log Parsing","publication_year":2025,"publication_date":"2025-10-27","ids":{"openalex":"https://openalex.org/W4415594438","doi":"https://doi.org/10.1109/tse.2025.3625121"},"language":null,"primary_location":{"id":"doi:10.1109/tse.2025.3625121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tse.2025.3625121","pdf_url":null,"source":{"id":"https://openalex.org/S8351582","display_name":"IEEE Transactions on Software Engineering","issn_l":"0098-5589","issn":["0098-5589","1939-3520","2326-3881"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Software Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101636992","display_name":"Chenbo Zhang","orcid":"https://orcid.org/0009-0009-1779-8040"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chenbo Zhang","raw_affiliation_strings":["Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036668090","display_name":"Wenying Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenying Xu","raw_affiliation_strings":["Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017058942","display_name":"Jinbu Liu","orcid":"https://orcid.org/0009-0004-5933-2971"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinbu Liu","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100388587","display_name":"Lu Zhang","orcid":"https://orcid.org/0000-0001-9532-5219"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lu Zhang","raw_affiliation_strings":["Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081766211","display_name":"Guiyang Liu","orcid":"https://orcid.org/0009-0000-3383-9409"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guiyang Liu","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086316879","display_name":"Jihong Guan","orcid":"https://orcid.org/0000-0003-2313-7635"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jihong Guan","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101631796","display_name":"Qi Zhou","orcid":"https://orcid.org/0000-0002-7759-800X"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Zhou","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017862559","display_name":"Shuigeng Zhou","orcid":"https://orcid.org/0000-0002-1949-2768"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuigeng Zhou","raw_affiliation_strings":["Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intelligent Information Processing, and the School of Computer Science and Artificial Intelligence, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5101636992"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16487566,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"52","issue":"1","first_page":"155","last_page":"170"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9740999937057495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9740999937057495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9706000089645386,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.9327999949455261,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.8440999984741211},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.42010000348091125},{"id":"https://openalex.org/keywords/parse-tree","display_name":"Parse tree","score":0.4169999957084656},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.3982999920845032},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.39250001311302185},{"id":"https://openalex.org/keywords/semantic-analysis","display_name":"Semantic analysis (machine learning)","score":0.3206000030040741},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.3172000050544739}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9085000157356262},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.8440999984741211},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5726000070571899},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4756999909877777},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.42010000348091125},{"id":"https://openalex.org/C2781466058","wikidata":"https://www.wikidata.org/wiki/Q627921","display_name":"Parse tree","level":3,"score":0.4169999957084656},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.3982999920845032},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.39250001311302185},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.3206000030040741},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.3172000050544739},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3149000108242035},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.30570000410079956},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.287200003862381},{"id":"https://openalex.org/C53893814","wikidata":"https://www.wikidata.org/wiki/Q7378909","display_name":"Rule-based machine translation","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2687999904155731},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.2671999931335449},{"id":"https://openalex.org/C118364021","wikidata":"https://www.wikidata.org/wiki/Q7139956","display_name":"Parser combinator","level":3,"score":0.266400009393692},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2637999951839447},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.2556999921798706}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tse.2025.3625121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tse.2025.3625121","pdf_url":null,"source":{"id":"https://openalex.org/S8351582","display_name":"IEEE Transactions on Software Engineering","issn_l":"0098-5589","issn":["0098-5589","1939-3520","2326-3881"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Software Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W2039157918","https://openalex.org/W2115056012","https://openalex.org/W2562383263","https://openalex.org/W2583874385","https://openalex.org/W2754665629","https://openalex.org/W2755402962","https://openalex.org/W2767094836","https://openalex.org/W2947815220","https://openalex.org/W2963999143","https://openalex.org/W3041215671","https://openalex.org/W3163667769","https://openalex.org/W3167387776","https://openalex.org/W3195057108","https://openalex.org/W3203565869","https://openalex.org/W4221079409","https://openalex.org/W4226128225","https://openalex.org/W4239854741","https://openalex.org/W4284692184","https://openalex.org/W4285294723","https://openalex.org/W4308642996","https://openalex.org/W4316661025","https://openalex.org/W4321354332","https://openalex.org/W4367146761","https://openalex.org/W4379116564","https://openalex.org/W4384345672","https://openalex.org/W4384345673","https://openalex.org/W4384345785","https://openalex.org/W4385245566","https://openalex.org/W4388483129","https://openalex.org/W4391579685","https://openalex.org/W4393158805","https://openalex.org/W4394745212","https://openalex.org/W4400583111","https://openalex.org/W4404782964","https://openalex.org/W4411450161"],"related_works":[],"abstract_inverted_index":{"Logs":[0],"of":[1,20,83,102,151,226,263],"large-scale":[2,207],"cloud":[3],"systems":[4],"record":[5],"diverse":[6],"system":[7],"events,":[8],"ranging":[9],"from":[10,76,173],"routine":[11],"statuses":[12],"to":[13,27,98,126,153,183,251],"critical":[14],"errors.":[15],"As":[16],"the":[17,81,100,115,149,154,200,212,220],"fundamental":[18],"step":[19],"automated":[21],"log":[22,24,104,119,141,155,164,174,222,264],"analysis,":[23],"parsing":[25,120,156,241],"is":[26],"transform":[28],"unstructured":[29],"logs":[30],"into":[31],"structured":[32],"data":[33,165,265],"for":[34,86,109,117,203],"easier":[35],"management":[36],"and":[37,42,74,138,187],"analysis.":[38],"However,":[39],"existing":[40,232,252],"syntax-based":[41],"deep":[43],"learning-based":[44],"parsers":[45,52,91,223,234,254],"struggle":[46],"with":[47,80,191],"complex":[48],"real-world":[49],"logs.":[50,208],"Recent":[51],"based":[53,256],"on":[54,66,94,206,211,257],"large":[55],"language":[56],"models":[57],"(LLMs)":[58],"achieve":[59],"higher":[60],"accuracy,":[61],"but":[62],"they":[63],"typically":[64],"rely":[65],"online":[67],"APIs":[68],"(e.g.,":[69],"ChatGPT),":[70,258],"raising":[71],"privacy":[72,266],"concerns":[73],"suffering":[75],"network":[77],"latency.":[78],"Moreover,":[79,228],"rise":[82],"artificial":[84],"intelligence":[85],"IT":[87],"operations":[88],"(AIOps),":[89],"traditional":[90],"that":[92,121,216],"focus":[93],"syntax-level":[95],"templates":[96],"fail":[97],"capture":[99],"semantics":[101],"dynamic":[103],"parameters,":[105],"limiting":[106],"their":[107,159],"usefulness":[108],"downstream":[110],"tasks.":[111],"These":[112],"challenges":[113],"highlight":[114],"need":[116],"semantic":[118,140,181,192,240],"goes":[122],"beyond":[123],"template":[124,186],"extraction":[125,189],"understand":[127],"parameter":[128,188],"semantics.":[129],"<p":[130],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[131],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">This":[132],"paper":[133],"presents":[134],"SemanticLog,":[135],"an":[136],"effective":[137],"efficient":[139],"parser":[142],"powered":[143],"by":[144],"open-source":[145,248],"LLMs.":[146],"SemanticLog":[147,198,217,244],"adapts":[148],"structure":[150],"LLMs":[152,249],"task,":[157],"leveraging":[158],"rich":[160],"knowledge":[161],"while":[162,237,259],"safeguarding":[163],"privacy.":[166],"It":[167],"first":[168],"extracts":[169],"informative":[170],"feature":[171],"representations":[172],"data,":[175],"then":[176],"refines":[177],"them":[178],"through":[179],"fine-grained":[180],"perception":[182],"enable":[184],"accurate":[185],"together":[190],"category":[193],"prediction.":[194],"To":[195],"boost":[196],"scalability,":[197],"introduces":[199],"EffiParsing":[201],"tree":[202],"faster":[204],"inference":[205],"Extensive":[209],"experiments":[210],"LogHub-2.0":[213],"dataset":[214],"show":[215],"significantly":[218],"outperforms":[219],"state-of-the-art":[221],"in":[224,235],"terms":[225],"accuracy.":[227],"it":[229],"also":[230],"surpasses":[231],"LLM-based":[233,253],"efficiency":[236],"showcasing":[238],"advanced":[239],"capability.":[242],"Notably,":[243],"employs":[245],"much":[246],"smaller":[247],"compared":[250],"(mainly":[255],"maintaining":[260],"better":[261],"capability":[262],"protection.":[267]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-28T00:00:00"}
