{"id":"https://openalex.org/W3199492011","doi":"https://doi.org/10.1145/3472749.3474771","title":"Hierarchical Summarization for Longform Spoken Dialog","display_name":"Hierarchical Summarization for Longform Spoken Dialog","publication_year":2021,"publication_date":"2021-10-10","ids":{"openalex":"https://openalex.org/W3199492011","doi":"https://doi.org/10.1145/3472749.3474771","mag":"3199492011"},"language":"en","primary_location":{"id":"doi:10.1145/3472749.3474771","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3472749.3474771","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 34th Annual ACM Symposium on User Interface Software and Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100714110","display_name":"Daniel Li","orcid":"https://orcid.org/0000-0002-7536-3418"},"institutions":[{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Daniel Li","raw_affiliation_strings":["Columbia University, United States"],"affiliations":[{"raw_affiliation_string":"Columbia University, United States","institution_ids":["https://openalex.org/I78577930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100599747","display_name":"Thomas Chen","orcid":"https://orcid.org/0000-0001-6398-093X"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas Chen","raw_affiliation_strings":["Microsoft, United States"],"affiliations":[{"raw_affiliation_string":"Microsoft, United States","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005911114","display_name":"Albert Tung","orcid":"https://orcid.org/0000-0002-6129-7819"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Albert Tung","raw_affiliation_strings":["Stanford University, United States"],"affiliations":[{"raw_affiliation_string":"Stanford University, United States","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049173646","display_name":"Lydia B. Chilton","orcid":"https://orcid.org/0000-0002-1737-1276"},"institutions":[{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lydia B Chilton","raw_affiliation_strings":["Computer Science Department Columbia University, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science Department Columbia University, United States","institution_ids":["https://openalex.org/I78577930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100714110"],"corresponding_institution_ids":["https://openalex.org/I78577930"],"apc_list":null,"apc_paid":null,"fwci":1.1199,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.82520715,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"582","last_page":"597"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.8971794247627258},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8856633901596069},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6277769804000854},{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.5465020537376404},{"id":"https://openalex.org/keywords/spoken-language","display_name":"Spoken language","score":0.5372215509414673},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5067616105079651},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.48660290241241455},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47168901562690735},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4262961745262146},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.41648024320602417},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.1684080958366394}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.8971794247627258},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8856633901596069},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6277769804000854},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.5465020537376404},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.5372215509414673},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5067616105079651},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.48660290241241455},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47168901562690735},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4262961745262146},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.41648024320602417},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.1684080958366394},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3472749.3474771","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3472749.3474771","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 34th Annual ACM Symposium on User Interface Software and Technology","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4399999976158142,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1834627372","https://openalex.org/W1973950142","https://openalex.org/W2006960950","https://openalex.org/W2045942221","https://openalex.org/W2060666149","https://openalex.org/W2061585017","https://openalex.org/W2106918957","https://openalex.org/W2123718485","https://openalex.org/W2215310981","https://openalex.org/W2505877856","https://openalex.org/W2588775355","https://openalex.org/W2808114373","https://openalex.org/W2936695845","https://openalex.org/W2941514234","https://openalex.org/W2970641574","https://openalex.org/W2977940954","https://openalex.org/W2989743967","https://openalex.org/W3034383590","https://openalex.org/W3087283451","https://openalex.org/W3089241472","https://openalex.org/W3093699630","https://openalex.org/W3093732029","https://openalex.org/W3098103528","https://openalex.org/W3099474967","https://openalex.org/W3100560913","https://openalex.org/W3125649296","https://openalex.org/W3175228675","https://openalex.org/W4241247176"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W4389760904","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4306886878","https://openalex.org/W2949169006","https://openalex.org/W2034361844"],"abstract_inverted_index":{"Every":[0],"day":[1],"we":[2,121,168],"are":[3,105],"surrounded":[4],"by":[5],"spoken":[6,29,89,116],"dialog.":[7],"This":[8],"medium":[9],"delivers":[10],"rich":[11],"diverse":[12],"streams":[13],"of":[14,28,67,135,172,192],"information":[15,36],"auditorily;":[16],"however,":[17],"systematically":[18],"understanding":[19,33,50],"dialog":[20],"can":[21],"often":[22],"be":[23],"non-trivial.":[24],"Despite":[25],"the":[26,73,88,173,195],"pervasiveness":[27],"dialog,":[30],"automated":[31],"speech":[32,78,95,144],"and":[34,65,86,98,112,127,131,138,154,189],"quality":[35],"extraction":[37],"remains":[38],"markedly":[39],"poor,":[40],"especially":[41],"when":[42],"compared":[43,48],"to":[44,49,82,141,151,185,194],"written":[45],"prose.":[46],"Furthermore,":[47],"text,":[51],"auditory":[52],"communication":[53],"poses":[54],"many":[55],"additional":[56],"challenges":[57],"such":[58],"as":[59,157,159,182],"speaker":[60],"disfluencies,":[61],"informal":[62],"prose":[63],"styles,":[64],"lack":[66],"structure.":[68],"These":[69],"concerns":[70],"all":[71],"demonstrate":[72],"need":[74],"for":[75,179],"a":[76,123,133,183],"distinctly":[77],"tailored":[79],"interactive":[80],"system":[81,148,174],"help":[83],"users":[84,150],"understand":[85],"navigate":[87,155],"language":[90,117],"domain.":[91],"While":[92],"individual":[93],"automatic":[94],"recognition":[96],"(ASR)":[97],"text":[99,128],"summarization":[100,129,181],"methods":[101],"already":[102],"exist,":[103],"they":[104],"imperfect":[106],"technologies;":[107],"neither":[108],"consider":[109],"user":[110,177],"purpose":[111],"intent":[113],"nor":[114],"address":[115],"induced":[118],"complications.":[119],"Consequently,":[120],"design":[122],"two":[124],"stage":[125],"ASR":[126],"pipeline":[130],"propose":[132],"set":[134],"semantic":[136],"segmentation":[137],"merging":[139],"algorithms":[140],"resolve":[142],"these":[143,164],"modeling":[145],"challenges.":[146],"Our":[147],"enables":[149],"easily":[152],"browse":[153],"content":[156,191],"well":[158],"recover":[160],"from":[161],"errors":[162],"in":[163],"underlying":[165],"technologies.":[166],"Finally,":[167],"present":[169],"an":[170],"evaluation":[171],"which":[175],"highlights":[176],"preference":[178],"hierarchical":[180],"tool":[184],"quickly":[186],"skim":[187],"audio":[188],"identify":[190],"interest":[193],"user.":[196]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
