{"id":"https://openalex.org/W2160849440","doi":"https://doi.org/10.1109/tmm.2009.2017607","title":"Text-Like Segmentation of General Audio for Content-Based Retrieval","display_name":"Text-Like Segmentation of General Audio for Content-Based Retrieval","publication_year":2009,"publication_date":"2009-04-28","ids":{"openalex":"https://openalex.org/W2160849440","doi":"https://doi.org/10.1109/tmm.2009.2017607","mag":"2160849440"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2009.2017607","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2009.2017607","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110491600","display_name":"Lie Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lie Lu","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037486611","display_name":"Alan Hanjali\u0107","orcid":"https://orcid.org/0000-0002-5771-2549"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"A. Hanjalic","raw_affiliation_strings":["Department of Mediamatics, Delft University of Technnology, Delft, Netherlands"],"affiliations":[{"raw_affiliation_string":"Department of Mediamatics, Delft University of Technnology, Delft, Netherlands","institution_ids":["https://openalex.org/I98358874"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5110491600"],"corresponding_institution_ids":["https://openalex.org/I4210113369"],"apc_list":null,"apc_paid":null,"fwci":0.7049,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.71681775,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"11","issue":"4","first_page":"658","last_page":"669"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6839202642440796},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4991459846496582},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.47110775113105774},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4396982491016388},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36940261721611023}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6839202642440796},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4991459846496582},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.47110775113105774},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4396982491016388},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36940261721611023}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2009.2017607","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2009.2017607","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.5799999833106995,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1482605500","https://openalex.org/W1940377967","https://openalex.org/W1985593448","https://openalex.org/W1999956262","https://openalex.org/W2077456266","https://openalex.org/W2101258687","https://openalex.org/W2113198681","https://openalex.org/W2114762973","https://openalex.org/W2119577488","https://openalex.org/W2124495245","https://openalex.org/W2126109423","https://openalex.org/W2143092130","https://openalex.org/W2149022377","https://openalex.org/W2152322845","https://openalex.org/W2156481234","https://openalex.org/W2157933833","https://openalex.org/W2161755617","https://openalex.org/W2165874743","https://openalex.org/W2542529521","https://openalex.org/W4243306052","https://openalex.org/W6628911050","https://openalex.org/W6650430342","https://openalex.org/W6684578312","https://openalex.org/W6729414129"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Automatic":[0],"detection":[1],"of":[2,46,67,113,119,145,175,191,206,209],"(semantically)":[3],"meaningful":[4],"audio":[5,25,35,61,106,114,121,148,180,193,211,232],"segments,":[6],"or":[7],"<i":[8,11,68,71,75,78,81,136,139],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[9,12,69,72,76,79,82,137,140],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">audio</i>":[10,70,80],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">scenes</i>":[13],",":[14,84],"is":[15,108,129,169,219],"an":[16,65,105,120],"important":[17],"step":[18],"in":[19,53,96,228],"high-level":[20],"semantic":[21,158],"inference":[22],"from":[23,164],"general":[24],"signals,":[26],"and":[27,36,74,94,116,168,183,187],"can":[28,86],"benefit":[29],"various":[30],"content-based":[31],"applications":[32],"involving":[33],"both":[34],"multimodal":[37],"(multimedia)":[38],"data":[39,203,212],"sets.":[40],"Motivated":[41],"by":[42],"the":[43,92,102,117,135,146,161,176,179,184,188,192,216,223,230],"known":[44],"limitations":[45],"traditional":[47,224],"low-level":[48,225],"feature-based":[49,226],"approaches,":[50],"we":[51],"propose":[52],"this":[54],"paper":[55],"a":[56,97,111,125,173,201],"novel":[57],"approach":[58,218],"to":[59,91],"discover":[60],"scenes,":[62],"based":[63,131],"on":[64,132,200],"analysis":[66],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">elements</i>":[73,83],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">key</i>":[77],"which":[85],"be":[87],"seen":[88,109],"as":[89,110,172],"equivalents":[90],"words":[93],"keywords":[95],"text":[98,165],"document,":[99],"respectively.":[100],"In":[101],"proposed":[103,155,217],"approach,":[104],"track":[107],"sequence":[112],"elements,":[115],"presence":[118],"scene":[122,233],"boundary":[123],"at":[124],"given":[126],"time":[127,152],"stamp":[128],"checked":[130],"pair-wise":[133],"measuring":[134],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">semantic</i>":[138],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">affinity</i>":[141],"between":[142,178],"different":[143],"parts":[144,181],"analyzed":[147],"stream":[149],"surrounding":[150],"that":[151,215],"stamp.":[153],"Our":[154],"model":[156],"for":[157],"affinity":[159],"exploits":[160],"proven":[162],"concepts":[163],"document":[166],"analysis,":[167],"introduced":[170],"here":[171],"function":[174],"distance":[177],"considered,":[182],"co-occurrence":[185],"statistics":[186],"importance":[189],"weights":[190],"elements":[194],"contained":[195],"therein.":[196],"Experimental":[197],"evaluation":[198],"performed":[199],"representative":[202],"set":[204],"consisting":[205],"5":[207],"h":[208],"diverse":[210],"streams":[213],"indicated":[214],"more":[220],"effective":[221],"than":[222],"approaches":[227],"solving":[229],"posed":[231],"segmentation":[234],"problem.":[235]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
