{"id":"https://openalex.org/W2396252828","doi":"https://doi.org/10.21437/interspeech.2011-278","title":"Speech indexing using semantic context inference","display_name":"Speech indexing using semantic context inference","publication_year":2011,"publication_date":"2011-08-27","ids":{"openalex":"https://openalex.org/W2396252828","doi":"https://doi.org/10.21437/interspeech.2011-278","mag":"2396252828"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2011-278","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2011-278","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2011","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111774464","display_name":"Chien-Lin Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chien-Lin Huang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100749735","display_name":"Bin Ma","orcid":"https://orcid.org/0000-0002-9223-9654"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bin Ma","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":"https://orcid.org/0000-0001-9158-9401"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5103251327","display_name":"Chung\u2010Hsien Wu","orcid":"https://orcid.org/0000-0002-3947-2123"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chung-Hsien Wu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5111774464"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.1691,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.89691838,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"717","last_page":"720"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.84880131483078},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.621903121471405},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6138434410095215},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6124115586280823},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5741482973098755},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5480039119720459},{"id":"https://openalex.org/keywords/document-retrieval","display_name":"Document retrieval","score":0.4854632019996643},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.47618284821510315},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.42836907505989075}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.84880131483078},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.621903121471405},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6138434410095215},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6124115586280823},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5741482973098755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5480039119720459},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.4854632019996643},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.47618284821510315},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.42836907505989075},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2011-278","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2011-278","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2011","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7699999809265137}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W8882349","https://openalex.org/W2095368471","https://openalex.org/W2102261232","https://openalex.org/W2104212264","https://openalex.org/W2107743791","https://openalex.org/W2125595375","https://openalex.org/W2127923419","https://openalex.org/W2136440675","https://openalex.org/W2136542423","https://openalex.org/W2138451337","https://openalex.org/W2146229144","https://openalex.org/W2147152072","https://openalex.org/W2148986421","https://openalex.org/W2150857077","https://openalex.org/W2151742940","https://openalex.org/W2162439664"],"related_works":["https://openalex.org/W3024364549","https://openalex.org/W4206019083","https://openalex.org/W2048865712","https://openalex.org/W1976265003","https://openalex.org/W2370378377","https://openalex.org/W4237510188","https://openalex.org/W2130160813","https://openalex.org/W2389273994","https://openalex.org/W2188505374","https://openalex.org/W2028546017"],"abstract_inverted_index":{"Abstract":[0],"This":[1],"study":[2],"presents":[3],"a":[4,23,29,34,40,61,73,113,277,286],"novel":[5],"approach":[6,380],"to":[7,112,206,217,232,282,285,313,360],"spoken":[8,24,118,129,150,192,225,242,308,336,392],"document":[9,25,119,130,151,243,278,309,337],"retrieval":[10,131,152,238,244,302],"based":[11],"on":[12,83,202,271],"semantic":[13,30,37,41,45,57,62,69,108,126,345],"context":[14,46,70,109,127],"inference":[15,31,47,58,71,110],"for":[16,76,140,255,335],"speech":[17,77,104,124,221,253,315,387],"indexing.":[18,78,256,354],"Each":[19],"recognized":[20],"term":[21,63],"in":[22,153,227,307,322,351],"is":[26,49,135,214,279],"mapped":[27],"onto":[28],"vector":[32,48,72],"containing":[33],"bag":[35],"of":[36,94,117,143,149,178,182,199,293,299,396],"terms":[38],"through":[39],"relation":[42],"matrix.":[43],"The":[44,79,97,147,161,296,339,376],"then":[50],"constructed":[51],"by":[52],"summing":[53],"up":[54],"all":[55],"the":[56,68,102,107,136,141,176,204,220,224,228,240,248,320,386,397,405],"vectors.":[59],"Such":[60],"expansion":[64],"and":[65,145,156,175,186,236,261,319,324,346,373,394],"re-weighting":[66],"make":[67],"suitable":[74],"representation":[75],"experiments":[80],"were":[81],"conducted":[82],"1550":[84],"anchor":[85],"news":[86,93,184],"stories":[87],"collected":[88],"from":[89,251,391],"Mandarin":[90],"Chinese":[91],"broadcast":[92],"198":[95],"hours.":[96],"experimental":[98],"results":[99],"indicate":[100],"that":[101,212,275],"proposed":[103,359],"indexing":[105,297,329,366,379],"using":[106],"contributes":[111],"substantial":[114],"performance":[115],"improvement":[116],"retrieval.":[120,310,338],"Index":[121],"Terms":[122],":":[123],"indexing,":[125],"inference,":[128],"1.":[132],"Introduction":[133],"Speech":[134],"most":[137],"convenient":[138],"way":[139],"interaction":[142],"human-to-human":[144],"human-to-machine.":[146],"applications":[148],"education,":[154],"business":[155],"entertainment":[157],"are":[158,331],"rapidly":[159],"growing.":[160],"recent":[162],"attempts":[163],"include":[164],"multilingual":[165],"oral":[166],"history":[167],"archives":[168],"access":[169],"[1],":[170],"MIT":[171],"lecture":[172],"browsing":[173],"[2],":[174],"management":[177],"National":[179],"Gallery":[180],"consisting":[181],"speeches,":[183],"broadcasts":[185],"recordings":[187],"[3],":[188],"voice":[189],"search":[190],"about":[191],"dialog,":[193],"call-routing":[194],"systems":[195],"[4],":[196],"etc.":[197],"All":[198],"them":[200],"focus":[201],"retrieving":[203],"information":[205,301,383],"meet":[207],"users'":[208],"requirements.":[209],"We":[210],"know":[211],"it":[213,289],"not":[215,332],"straightforward":[216],"directly":[218],"compare":[219],"query":[222,287,294],"with":[223,364],"documents":[226],"database.":[229],"In":[230],"order":[231],"construct":[233],"an":[234,352],"efficient":[235],"effective":[237],"system,":[239],"state-of-the-art":[241],"(SDR)":[245],"technologies":[246],"adopt":[247],"transcription":[249,340],"obtained":[250],"automatic":[252],"recognition":[254,316],"Vector":[257],"space":[258],"model":[259],"[5]":[260],"probabilistic":[262],"models":[263],"(HMM":[264],"[6],":[265],"GMM":[266],"[7],":[267],"KL-divergence":[268],"[8]),":[269],"rely":[270],"certain":[272],"similarity":[273],"functions":[274],"assume":[276],"more":[280,291],"likely":[281],"be":[283],"relevant":[284],"if":[288],"contains":[290],"occurrences":[292],"terms.":[295],"techniques":[298,330],"text-based":[300,328],"have":[303,357],"been":[304,358],"widely":[305],"adopted":[306],"However,":[311],"due":[312],"imperfect":[314],"results,":[317],"out-of-vocabulary,":[318],"ambiguity":[321],"homophone":[323],"word":[325],"tokenization,":[326],"conventional":[327],"always":[333],"appropriate":[334],"errors":[341],"may":[342],"cause":[343],"undesired":[344],"syntactic":[347],"expression,":[348],"thus":[349],"result":[350],"inadequate":[353],"Several":[355],"approaches":[356],"address":[361],"these":[362],"problems":[363],"various":[365],"units":[367],"such":[368],"as":[369],"word,":[370],"sub-word,":[371],"phone,":[372],"so":[374],"on.":[375],"multi-level":[377],"knowledge":[378],"considers":[381],"three":[382],"sources":[384],"including":[385],"transcription,":[388],"keywords":[389,399],"extracted":[390,398],"documents,":[393],"hypernyms":[395],"[9].":[400],"Hui":[401],"et":[402],"al.":[403],"applied":[404]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
