{"id":"https://openalex.org/W2083524281","doi":"https://doi.org/10.1109/icassp.2013.6639339","title":"Sparse lexical representation for semantic entity resolution","display_name":"Sparse lexical representation for semantic entity resolution","publication_year":2013,"publication_date":"2013-05-01","ids":{"openalex":"https://openalex.org/W2083524281","doi":"https://doi.org/10.1109/icassp.2013.6639339","mag":"2083524281"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2013.6639339","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639339","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054207254","display_name":"Yuzhe Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yuzhe Jin","raw_affiliation_strings":["Microsoft Research, Redmond, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041659067","display_name":"Kuansan Wang","orcid":"https://orcid.org/0000-0001-7089-7966"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kuansan Wang","raw_affiliation_strings":["Microsoft Research, Redmond, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079458476","display_name":"Emre K\u0131c\u0131man","orcid":"https://orcid.org/0000-0001-5429-468X"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Emre Kiciman","raw_affiliation_strings":["Microsoft Research, Redmond, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5054207254"],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":0.4809,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.76499788,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"1","issue":null,"first_page":"8575","last_page":"8579"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8103529214859009},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6421027183532715},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.6022224426269531},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5602601766586304},{"id":"https://openalex.org/keywords/sparse-approximation","display_name":"Sparse approximation","score":0.5293520092964172},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.52070552110672},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.43124452233314514},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.42121654748916626},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3918442726135254},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.35886150598526}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8103529214859009},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6421027183532715},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.6022224426269531},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5602601766586304},{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.5293520092964172},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.52070552110672},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.43124452233314514},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.42121654748916626},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3918442726135254},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.35886150598526},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2013.6639339","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639339","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W11298561","https://openalex.org/W86887328","https://openalex.org/W1548663377","https://openalex.org/W1557103245","https://openalex.org/W1592871157","https://openalex.org/W1594128868","https://openalex.org/W1984568490","https://openalex.org/W2014896416","https://openalex.org/W2045887127","https://openalex.org/W2078204800","https://openalex.org/W2099464104","https://openalex.org/W2100341149","https://openalex.org/W2107628405","https://openalex.org/W2109449402","https://openalex.org/W2112941141","https://openalex.org/W2116148865","https://openalex.org/W2120480077","https://openalex.org/W2128092100","https://openalex.org/W2128659236","https://openalex.org/W2129812935","https://openalex.org/W2131357087","https://openalex.org/W2134237567","https://openalex.org/W2134517373","https://openalex.org/W2135046866","https://openalex.org/W2137012645","https://openalex.org/W2150761663","https://openalex.org/W2151693816","https://openalex.org/W2153636395","https://openalex.org/W2158195707","https://openalex.org/W2162638401","https://openalex.org/W2253807446","https://openalex.org/W2294690908","https://openalex.org/W2296616510","https://openalex.org/W2408607167","https://openalex.org/W2500358397","https://openalex.org/W2950186769","https://openalex.org/W2950789693","https://openalex.org/W3022380717","https://openalex.org/W4213009331","https://openalex.org/W4233559841","https://openalex.org/W4250955649","https://openalex.org/W4254240410","https://openalex.org/W6600479677","https://openalex.org/W6603544577","https://openalex.org/W6632852411","https://openalex.org/W6633578333","https://openalex.org/W6635311266","https://openalex.org/W6635490881","https://openalex.org/W6676702705","https://openalex.org/W6678242812","https://openalex.org/W6682469966","https://openalex.org/W6683847725","https://openalex.org/W6820645939","https://openalex.org/W6988049230"],"related_works":["https://openalex.org/W2383111961","https://openalex.org/W2365952365","https://openalex.org/W2352448290","https://openalex.org/W2380820513","https://openalex.org/W2913146933","https://openalex.org/W2372385138","https://openalex.org/W4296359239","https://openalex.org/W2329500892","https://openalex.org/W2101155126","https://openalex.org/W2043093291"],"abstract_inverted_index":{"This":[0],"paper":[1],"addresses":[2],"the":[3,19,43,46,61,75,85,94,98,106,112,128,134,150,154,170],"problem":[4],"of":[5,18,45,51,77,142,172],"semantic":[6,47],"entity":[7],"resolution":[8,44],"(SER),":[9],"which":[10,39],"aims":[11],"to":[12,42,56,83,103],"determine":[13],"whether":[14],"some":[15],"or":[16],"none":[17],"entities":[20,48],"in":[21,27,60,176],"a":[22,28,52,138],"knowledge":[23,139],"base":[24,140],"is":[25],"mentioned":[26],"given":[29],"web":[30,62,178],"document.":[31],"The":[32],"lexical":[33,58,88,108],"features,":[34],"e.g.,":[35],"words":[36],"and":[37,64],"phrases,":[38],"are":[40,49,81],"critical":[41],"typically":[50],"small":[53],"amount":[54],"compared":[55],"all":[57,105],"features":[59,109,123],"document,":[63],"therefore":[65],"can":[66],"be":[67],"modeled":[68],"as":[69,133],"sparse":[70,78,173],"signals.":[71],"Two":[72],"techniques":[73,152,175],"leveraging":[74],"principles":[76],"signal":[79,174],"recovery":[80],"proposed":[82,151],"identify":[84],"sparse,":[86],"salient":[87,107,122],"features:":[89],"one":[90,124,126],"technique,":[91,114],"based":[92],"on":[93],"Lasso":[95],"algorithm":[96],"with":[97],"l2-norm":[99],"distance":[100,135],"metric,":[101],"attempts":[102],"recover":[104],"at":[110],"once;":[111],"other":[113],"namely":[115],"Posterior":[116],"Probability":[117],"Pursuit":[118],"(PPP),":[119],"sequentially":[120],"identifies":[121],"after":[125],"using":[127],"negative":[129],"log":[130],"posterior":[131],"probability":[132],"metric.":[136],"Using":[137],"consisting":[141],"about":[143],"100":[144],"million":[145],"entities,":[146],"we":[147],"show":[148],"that":[149],"exploiting":[153],"sparsity":[155,167],"nature":[156],"underlying":[157],"SER":[158],"deliver":[159],"substantial":[160],"performance":[161],"improvement":[162],"over":[163],"baseline":[164],"methods":[165],"without":[166],"consideration,":[168],"demonstrating":[169],"potentials":[171],"entity-centric":[177],"information":[179],"processing.":[180]},"counts_by_year":[{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
