{"id":"https://openalex.org/W2085719526","doi":"https://doi.org/10.1109/icis.2014.6912172","title":"Joint speech/audio coding based scalable perceptual audio coding","display_name":"Joint speech/audio coding based scalable perceptual audio coding","publication_year":2014,"publication_date":"2014-06-01","ids":{"openalex":"https://openalex.org/W2085719526","doi":"https://doi.org/10.1109/icis.2014.6912172","mag":"2085719526"},"language":"en","primary_location":{"id":"doi:10.1109/icis.2014.6912172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icis.2014.6912172","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE/ACIS 13th International Conference on Computer and Information Science (ICIS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072984216","display_name":"Li Gao","orcid":"https://orcid.org/0000-0002-5918-3505"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Li Gao","raw_affiliation_strings":["National Engineering Research Center for Multimedia Software, Computer School of Wuhan University, China","National Engineering Research Center for Multimedia Software; Computer School of Wuhan University; China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Multimedia Software, Computer School of Wuhan University, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"National Engineering Research Center for Multimedia Software; Computer School of Wuhan University; China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087726516","display_name":"Ruimin Hu","orcid":"https://orcid.org/0000-0002-0290-5757"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruimin Hu","raw_affiliation_strings":["National Engineering Research Center for Multimedia Software, Computer School of Wuhan University, China","National Engineering Research Center for Multimedia Software; Computer School of Wuhan University; China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Multimedia Software, Computer School of Wuhan University, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"National Engineering Research Center for Multimedia Software; Computer School of Wuhan University; China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102859655","display_name":"Yuhong Yang","orcid":"https://orcid.org/0000-0003-3001-7957"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhong Yang","raw_affiliation_strings":["National Engineering Research Center for Multimedia Software, Computer School of Wuhan University, China","National Engineering Research Center for Multimedia Software; Computer School of Wuhan University; China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Multimedia Software, Computer School of Wuhan University, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"National Engineering Research Center for Multimedia Software; Computer School of Wuhan University; China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5072984216"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14546505,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"429","last_page":"434"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9746000170707703,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7832047939300537},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.7755494117736816},{"id":"https://openalex.org/keywords/sub-band-coding","display_name":"Sub-band coding","score":0.6457803249359131},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6045252084732056},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.5952035188674927},{"id":"https://openalex.org/keywords/wideband-audio","display_name":"Wideband audio","score":0.553330659866333},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.511053204536438},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5060779452323914},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.48607566952705383},{"id":"https://openalex.org/keywords/adaptive-multi-rate-audio-codec","display_name":"Adaptive Multi-Rate audio codec","score":0.4670015573501587},{"id":"https://openalex.org/keywords/harmonic-vector-excitation-coding","display_name":"Harmonic Vector Excitation Coding","score":0.4190077483654022},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.36202263832092285},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.35583391785621643},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.27887409925460815},{"id":"https://openalex.org/keywords/digital-audio","display_name":"Digital audio","score":0.2708876430988312},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.06357783079147339}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7832047939300537},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.7755494117736816},{"id":"https://openalex.org/C98526533","wikidata":"https://www.wikidata.org/wiki/Q1691938","display_name":"Sub-band coding","level":3,"score":0.6457803249359131},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6045252084732056},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.5952035188674927},{"id":"https://openalex.org/C173391809","wikidata":"https://www.wikidata.org/wiki/Q2740189","display_name":"Wideband audio","level":5,"score":0.553330659866333},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.511053204536438},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5060779452323914},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.48607566952705383},{"id":"https://openalex.org/C177067256","wikidata":"https://www.wikidata.org/wiki/Q4676210","display_name":"Adaptive Multi-Rate audio codec","level":4,"score":0.4670015573501587},{"id":"https://openalex.org/C80167644","wikidata":"https://www.wikidata.org/wiki/Q463990","display_name":"Harmonic Vector Excitation Coding","level":3,"score":0.4190077483654022},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.36202263832092285},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.35583391785621643},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.27887409925460815},{"id":"https://openalex.org/C87687168","wikidata":"https://www.wikidata.org/wiki/Q173114","display_name":"Digital audio","level":4,"score":0.2708876430988312},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.06357783079147339},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icis.2014.6912172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icis.2014.6912172","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE/ACIS 13th International Conference on Computer and Information Science (ICIS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W1539500535","https://openalex.org/W2125698390","https://openalex.org/W2138422448","https://openalex.org/W2166217673"],"related_works":["https://openalex.org/W2042028224","https://openalex.org/W2106874932","https://openalex.org/W1877515347","https://openalex.org/W1857623347","https://openalex.org/W1578591928","https://openalex.org/W2111280847","https://openalex.org/W2115236569","https://openalex.org/W2154660412","https://openalex.org/W2980446847","https://openalex.org/W1936271610"],"abstract_inverted_index":{"With":[0],"the":[1,87,91,99,115,119,131],"technical":[2],"evolution":[3],"of":[4,24,48,122],"global":[5],"mobile":[6,107],"communications,":[7],"various":[8],"heterogeneous":[9],"communication":[10],"environments,":[11],"frequently":[12],"fluctuant":[13],"bandwidth":[14,93],"and":[15,51,56,74,90,130],"multiform":[16],"signals":[17,47],"put":[18],"new":[19],"challenges":[20],"to":[21,101],"coding":[22,37,45,66,72],"technology":[23],"multimedia":[25,61,108],"signals.":[26],"Scalable":[27],"Audio":[28],"Coding":[29],"(SAC)":[30],"can":[31,52],"provide":[32],"smooth":[33],"transition":[34],"between":[35],"different":[36,49],"qualities,":[38],"which":[39],"is":[40,125,133],"an":[41,75],"optimal":[42],"choice":[43],"for":[44],"audio":[46,65,88],"types":[50],"produce":[53],"more":[54],"reliable":[55],"consistent":[57],"service":[58,104],"quality":[59,121],"in":[60,98,106],"communications.":[62],"A":[63],"scalable":[64],"system":[67,100],"based":[68,80],"on":[69,81],"joint":[70],"speech/audio":[71],"method":[73,124],"auditory":[76],"perceptual":[77],"importance":[78],"model":[79],"bit-plane":[82],"are":[83],"proposed":[84,123],"here.":[85],"Both":[86],"content":[89],"network":[92],"fluctuation":[94],"will":[95],"be":[96],"considered":[97],"obtain":[102],"stable":[103],"qualities":[105],"services.":[109],"Experimental":[110],"results":[111],"indicate":[112],"that":[113],"with":[114],"same":[116],"bit":[117],"rates":[118],"subjective":[120],"slightly":[126],"better":[127],"than":[128],"G.729.1":[129],"SNR":[132],"improved":[134],"by":[135],"0.3dB.":[136]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
