{"id":"https://openalex.org/W7162686671","doi":"https://doi.org/10.48550/arxiv.2605.27441","title":"A Unified Structured Query Understanding Framework for Industrial Semantic Search","display_name":"A Unified Structured Query Understanding Framework for Industrial Semantic Search","publication_year":2026,"publication_date":"2026-05-22","ids":{"openalex":"https://openalex.org/W7162686671","doi":"https://doi.org/10.48550/arxiv.2605.27441"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.27441","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27441","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.27441","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137196492","display_name":"Ping Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Ping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013032251","display_name":"Qianqi Shen","orcid":"https://orcid.org/0000-0002-9323-6404"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Qianqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137232657","display_name":"Jianqiang Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Jianqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132903020","display_name":"Chunnan Yao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yao, Chunnan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065398158","display_name":"Kevin Kao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kao, Kevin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137212186","display_name":"Rajat Arora","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arora, Rajat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137257424","display_name":"Dan Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Dan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109449817","display_name":"Baofen Zheng","orcid":"https://orcid.org/0009-0001-7494-2899"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Baofen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137282306","display_name":"Yunxiang Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Yunxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137284157","display_name":"Benjamin Le","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Le, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011520457","display_name":"Ali Hooshmand","orcid":"https://orcid.org/0009-0006-1846-2344"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hooshmand, Ali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137280279","display_name":"Igor Lapchuk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lapchuk, Igor","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125579143","display_name":"Juan Bottaro","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bottaro, Juan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137297340","display_name":"Raghavan Muthuregunathan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muthuregunathan, Raghavan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137244250","display_name":"Caleb Johnson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Johnson, Caleb","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137203220","display_name":"Liangjie Hong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong, Liangjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137245723","display_name":"Jingwei Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Jingwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137266521","display_name":"Wenjing Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Wenjing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":18,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.6079999804496765,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.6079999804496765,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.09489999711513519,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.06159999966621399,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6492000222206116},{"id":"https://openalex.org/keywords/query-language","display_name":"Query language","score":0.6051999926567078},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.590499997138977},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.527400016784668},{"id":"https://openalex.org/keywords/query-expansion","display_name":"Query expansion","score":0.5054000020027161},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.4650999903678894},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.45210000872612},{"id":"https://openalex.org/keywords/sargable","display_name":"Sargable","score":0.43799999356269836},{"id":"https://openalex.org/keywords/extensibility","display_name":"Extensibility","score":0.4034999907016754},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.3959999978542328}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8569999933242798},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6492000222206116},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.6051999926567078},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.590499997138977},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.527400016784668},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.5054000020027161},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.4650999903678894},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.45210000872612},{"id":"https://openalex.org/C192939062","wikidata":"https://www.wikidata.org/wiki/Q104840822","display_name":"Sargable","level":4,"score":0.43799999356269836},{"id":"https://openalex.org/C32833848","wikidata":"https://www.wikidata.org/wiki/Q4115054","display_name":"Extensibility","level":2,"score":0.4034999907016754},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3959999978542328},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3813999891281128},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.3240000009536743},{"id":"https://openalex.org/C157154645","wikidata":"https://www.wikidata.org/wiki/Q7441612","display_name":"Search-oriented architecture","level":5,"score":0.32100000977516174},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3208000063896179},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31209999322891235},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3100999891757965},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.30390000343322754},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C96956885","wikidata":"https://www.wikidata.org/wiki/Q6138701","display_name":"RDF query language","level":5,"score":0.289900004863739},{"id":"https://openalex.org/C98025372","wikidata":"https://www.wikidata.org/wiki/Q477538","display_name":"Systems architecture","level":3,"score":0.2881999909877777},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C2779729312","wikidata":"https://www.wikidata.org/wiki/Q784232","display_name":"Query plan","level":5,"score":0.2791999876499176},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C24028149","wikidata":"https://www.wikidata.org/wiki/Q7094056","display_name":"Online aggregation","level":5,"score":0.2578999996185303},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.2572999894618988},{"id":"https://openalex.org/C2778816267","wikidata":"https://www.wikidata.org/wiki/Q21015578","display_name":"Semantic query","level":4,"score":0.2547999918460846},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.25450000166893005},{"id":"https://openalex.org/C2779585090","wikidata":"https://www.wikidata.org/wiki/Q3457762","display_name":"Resilience (materials science)","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.27441","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27441","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.27441","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27441","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","score":0.4193531274795532,"display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Query":[0,76],"understanding":[1,47],"in":[2,29,71],"large-scale":[3],"industrial":[4],"search":[5],"systems":[6],"is":[7],"typically":[8],"implemented":[9],"as":[10],"a":[11,43,55,78,84,94,128],"cascade":[12],"of":[13],"disparate,":[14],"task-specific":[15],"components.":[16],"While":[17],"individually":[18],"optimizable,":[19],"this":[20,37,107],"fragmented":[21],"architecture":[22],"incurs":[23],"high":[24],"maintenance":[25],"overhead":[26],"and":[27,41,90,92,112,141],"results":[28,136],"inconsistent":[30],"behaviors,":[31],"particularly":[32],"for":[33,87,97],"long-tail":[34],"queries.":[35],"In":[36],"work,":[38],"we":[39,74,121],"propose":[40],"deploy":[42],"unified":[44,72],"structured":[45],"query":[46],"system":[48],"that":[49,61],"consolidates":[50],"these":[51],"heterogeneous":[52],"functions":[53],"into":[54],"single":[56],"Small":[57],"Language":[58],"Model":[59],"(SLM)":[60],"performs":[62],"schema-constrained":[63],"generation.":[64],"To":[65],"address":[66],"the":[67,123],"data":[68],"bottlenecks":[69],"inherent":[70],"modeling,":[73],"introduce":[75],"Illuminator,":[77],"dual-purpose":[79],"framework":[80],"serving":[81,150],"as:":[82],"(i)":[83],"teacher":[85],"model":[86],"high-quality":[88],"auto-annotation":[89],"distillation,":[91],"(ii)":[93],"surrogate":[95],"judge":[96],"scalable":[98],"evaluation":[99],"where":[100],"human":[101],"labels":[102],"are":[103],"scarce.":[104],"We":[105],"validate":[106],"approach":[108],"through":[109,127],"extensive":[110],"offline":[111],"online":[113],"tests":[114],"within":[115],"LinkedIn's":[116],"Job":[117],"Search":[118],"system.":[119],"Furthermore,":[120],"demonstrate":[122],"framework's":[124],"horizontal":[125],"extensibility":[126],"cross-domain":[129],"case":[130],"study":[131],"on":[132,152],"People":[133],"Search.":[134],"The":[135],"show":[137],"improved":[138],"user":[139],"engagement":[140],"reduced":[142],"operational":[143],"costs,":[144],"achieved":[145],"while":[146],"satisfying":[147],"strict":[148],"low-latency":[149],"constraints":[151],"limited":[153],"GPU":[154],"resources.":[155]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-29T00:00:00"}
