{"id":"https://openalex.org/W7154715737","doi":"https://doi.org/10.48550/arxiv.2604.14531","title":"TRACER: Trace-Based Adaptive Cost-Efficient Routing for LLM Classification","display_name":"TRACER: Trace-Based Adaptive Cost-Efficient Routing for LLM Classification","publication_year":2026,"publication_date":"2026-04-16","ids":{"openalex":"https://openalex.org/W7154715737","doi":"https://doi.org/10.48550/arxiv.2604.14531"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.14531","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14531","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.14531","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021098005","display_name":"Adam Rida","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rida, Adam","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5021098005"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.24009999632835388,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.24009999632835388,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.10760000348091125,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.061900001019239426,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.6955999732017517},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6033999919891357},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.43149998784065247},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.41350001096725464},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.3626999855041504},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.3497999906539917},{"id":"https://openalex.org/keywords/surrogate-data","display_name":"Surrogate data","score":0.3467999994754791}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.6955999732017517},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6638000011444092},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6033999919891357},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.43149998784065247},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42419999837875366},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4169999957084656},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.41350001096725464},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3937000036239624},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.3626999855041504},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.3497999906539917},{"id":"https://openalex.org/C142806159","wikidata":"https://www.wikidata.org/wiki/Q7646876","display_name":"Surrogate data","level":3,"score":0.3467999994754791},{"id":"https://openalex.org/C147494362","wikidata":"https://www.wikidata.org/wiki/Q2078905","display_name":"Troubleshooting","level":2,"score":0.3382999897003174},{"id":"https://openalex.org/C131675550","wikidata":"https://www.wikidata.org/wiki/Q7646884","display_name":"Surrogate model","level":2,"score":0.3325999975204468},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.32760000228881836},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3167000114917755},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.30799999833106995},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3021000027656555},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.28870001435279846},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.14531","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14531","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.14531","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14531","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Every":[0],"call":[1],"to":[2,54],"an":[3,76,84],"LLM":[4,106],"classification":[5],"endpoint":[6],"produces":[7],"a":[8,20,25,33,93,108,137,142,158,168],"labeled":[9],"input-output":[10],"pair":[11],"already":[12],"retained":[13],"in":[14],"production":[15,87],"logs.":[16],"These":[17],"pairs":[18],"constitute":[19],"free,":[21],"growing":[22],"training":[23],"set:":[24],"lightweight":[26],"surrogate":[27,50,97,127,149,162],"trained":[28],"on":[29,83,152,157],"them":[30],"can":[31],"absorb":[32],"significant":[34],"portion":[35],"of":[36],"future":[37],"traffic":[38],"at":[39],"near-zero":[40],"marginal":[41],"inference":[42,171],"cost.":[43],"The":[44,187],"open":[45],"questions":[46],"are":[47],"when":[48,101],"the":[49,96,105,114,126,153,161,165,173,180],"is":[51,98,189],"reliable":[52,185],"enough":[53],"deploy,":[55],"what":[56],"it":[57,130,134],"handles":[58],"versus":[59],"defers,":[60],"and":[61,89,132],"how":[62],"that":[63,79],"boundary":[64,116],"evolves":[65],"as":[66,191],"data":[67],"accumulates.":[68],"We":[69],"introduce":[70],"TRACER":[71,118,146],"(Trace-based":[72],"Adaptive":[73],"Cost-Efficient":[74],"Routing),":[75],"open-source":[77,192],"system":[78,188],"trains":[80],"ML":[81],"surrogates":[82],"LLM's":[85],"own":[86],"traces":[88],"governs":[90],"deployment":[91,178],"through":[92],"parity":[94,174],"gate:":[95],"activated":[99],"only":[100],"its":[102],"agreement":[103],"with":[104,141],"exceeds":[107],"user-specified":[109],"threshold":[110],"\u03b1.":[111],"To":[112],"make":[113],"routing":[115],"transparent,":[117],"generates":[119],"interpretability":[120],"artifacts":[121],"describing":[122],"which":[123],"input":[124],"regions":[125],"handles,":[128],"where":[129],"plateaus,":[131],"why":[133],"defers.":[135],"On":[136,167],"77-class":[138],"intent":[139],"benchmark":[140],"Sonnet":[143],"4.6":[144],"teacher,":[145],"achieves":[147],"83-100%":[148],"coverage":[150],"depending":[151],"quality":[154],"target":[155],"\u03b1;":[156],"150-class":[159],"benchmark,":[160],"fully":[163],"replaces":[164],"teacher.":[166],"natural":[169],"language":[170],"task,":[172],"gate":[175],"correctly":[176],"refuses":[177],"because":[179],"embedding":[181],"representation":[182],"cannot":[183],"support":[184],"separation.":[186],"available":[190],"software.":[193]},"counts_by_year":[],"updated_date":"2026-04-18T06:05:20.339008","created_date":"2026-04-18T00:00:00"}
