{"id":"https://openalex.org/W7155053804","doi":"https://doi.org/10.48550/arxiv.2604.16810","title":"Gleaner: A Semantically-Rich and Efficient Online Sampler for Microservice Diagnostics","display_name":"Gleaner: A Semantically-Rich and Efficient Online Sampler for Microservice Diagnostics","publication_year":2026,"publication_date":"2026-04-18","ids":{"openalex":"https://openalex.org/W7155053804","doi":"https://doi.org/10.48550/arxiv.2604.16810"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.16810","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.16810","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.16810","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000074603","display_name":"Yi Yang","orcid":"https://orcid.org/0000-0002-4091-8532"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang, Yifan","raw_affiliation_strings":["The Chinese University of Hong Kong, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, Shenzhen","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102890900","display_name":"Aoyang Fang","orcid":"https://orcid.org/0009-0006-7116-5613"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"FANG, Aoyang","raw_affiliation_strings":["The Chinese University of Hong Kong, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, Shenzhen","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040008769","display_name":"Songhan Zhang","orcid":"https://orcid.org/0009-0009-0289-0338"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhang, Songhan","raw_affiliation_strings":["The Chinese University of Hong Kong, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, Shenzhen","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5134126617","display_name":"Pinjia He","orcid":null},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"He, Pinjia","raw_affiliation_strings":["The Chinese University of Hong Kong, Shenzhen"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, Shenzhen","institution_ids":["https://openalex.org/I4210116924"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210116924"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.0013000000035390258,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.0010999999940395355,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7840999960899353},{"id":"https://openalex.org/keywords/tracing","display_name":"Tracing","score":0.6894000172615051},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5321999788284302},{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.5001999735832214},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.49729999899864197},{"id":"https://openalex.org/keywords/microservices","display_name":"Microservices","score":0.4950999915599823},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.46810001134872437},{"id":"https://openalex.org/keywords/multigraph","display_name":"Multigraph","score":0.4456000030040741}],"concepts":[{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7840999960899353},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7785000205039978},{"id":"https://openalex.org/C138673069","wikidata":"https://www.wikidata.org/wiki/Q322229","display_name":"Tracing","level":2,"score":0.6894000172615051},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5698999762535095},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5321999788284302},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.5001999735832214},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.49729999899864197},{"id":"https://openalex.org/C2778505942","wikidata":"https://www.wikidata.org/wiki/Q18344624","display_name":"Microservices","level":3,"score":0.4950999915599823},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.46810001134872437},{"id":"https://openalex.org/C17758045","wikidata":"https://www.wikidata.org/wiki/Q2642629","display_name":"Multigraph","level":3,"score":0.4456000030040741},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4041000008583069},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.3991999924182892},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.37790000438690186},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3702999949455261},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3621000051498413},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.3034000098705292},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2935999929904938},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.27869999408721924},{"id":"https://openalex.org/C130963320","wikidata":"https://www.wikidata.org/wiki/Q1401207","display_name":"Root cause analysis","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2540999948978424},{"id":"https://openalex.org/C196921405","wikidata":"https://www.wikidata.org/wiki/Q786431","display_name":"Online algorithm","level":2,"score":0.250900000333786},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.16810","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.16810","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.16810","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.16810","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Distributed":[0],"tracing":[1],"in":[2,50],"microservices":[3],"is":[4,68,173],"critical":[5],"for":[6,80,121,198],"diagnostics":[7],"but":[8],"generates":[9],"overwhelming":[10],"data":[11,172,189],"volumes,":[12],"necessitating":[13],"intelligent":[14,185],"sampling.":[15],"To":[16,53],"maximize":[17],"fidelity,":[18],"state-of-the-art":[19],"(SOTA)":[20],"tail-based":[21],"samplers":[22],"analyze":[23],"complete":[24],"(or":[25],"even":[26],"log-enriched)":[27],"traces":[28,120,130],"by":[29,138,145,161],"modeling":[30],"them":[31],"as":[32,89],"graphs.":[33],"However,":[34],"this":[35,54,65],"reliance":[36],"on":[37,70,169],"computationally":[38],"expensive":[39],"graph":[40,76,98],"analysis":[41],"creates":[42],"a":[43,90,112,153,188,193],"performance":[44],"bottleneck":[45],"that":[46,63,74],"prohibits":[47],"their":[48],"use":[49],"online":[51,60],"settings.":[52],"end,":[55],"we":[56],"propose":[57],"Gleaner,":[58],"an":[59,108],"tail-sampling":[61],"framework":[62],"breaks":[64],"trade-off.":[66],"It":[67,105],"founded":[69],"the":[71,164,178],"key":[72],"insight":[73],"explicit":[75],"structures":[77],"are":[78],"unnecessary":[79],"high-fidelity":[81],"trace":[82,88],"grouping.":[83],"Instead,":[84],"Gleaner":[85,128,157],"represents":[86],"each":[87],"\"bag-of-edges\"":[91],"augmented":[92],"with":[93,100,177],"log":[94],"semantics,":[95],"replacing":[96],"slow":[97],"algorithms":[99],"highly":[101],"efficient":[102],"set-based":[103],"operations.":[104,200],"also":[106],"employs":[107],"alarm-driven":[109],"quota":[110],"and":[111,118,142],"diversity-preserving":[113],"strategy":[114],"to":[115,140,147,192],"prioritize":[116],"anomalous":[117],"rare":[119],"downstream":[122],"Root":[123],"Cause":[124],"Analysis":[125],"(RCA).":[126],"Experimentally,":[127],"processes":[129],"at":[131],"0.74ms":[132],"each,":[133],"improving":[134],"Trace":[135],"Pattern":[136],"Coverage":[137],"up":[139,146],"128.7%":[141],"Shannon":[143],"Entropy":[144],"32.9%":[148],"over":[149,163],"baselines.":[150],"At":[151],"just":[152],"1%":[154],"sampling":[155,186],"rate,":[156],"improves":[158],"RCA":[159,168],"accuracy":[160],"42%-107%":[162],"next-best":[165],"sampler.":[166],"Moreover,":[167],"Gleaner's":[170],"sampled":[171],"more":[174],"accurate":[175],"than":[176],"entire,":[179],"unsampled":[180],"dataset.":[181],"This":[182],"result":[183],"reframes":[184],"from":[187],"reduction":[190],"technique":[191],"powerful":[194],"signal":[195],"enhancement":[196],"paradigm":[197],"automated":[199]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2026-04-22T00:00:00"}
