{"id":"https://openalex.org/W7141108878","doi":"https://doi.org/10.1109/icce67443.2026.11449775","title":"Neural Imitation of Human Perceptual Response to High-Resolution Audio","display_name":"Neural Imitation of Human Perceptual Response to High-Resolution Audio","publication_year":2026,"publication_date":"2026-02-03","ids":{"openalex":"https://openalex.org/W7141108878","doi":"https://doi.org/10.1109/icce67443.2026.11449775"},"language":null,"primary_location":{"id":"doi:10.1109/icce67443.2026.11449775","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icce67443.2026.11449775","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Conference on Consumer Electronics (ICCE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122119928","display_name":"Baicheng Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Baicheng Huang","raw_affiliation_strings":["Tsinghua University,Beijing,P. R. China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Beijing,P. R. China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130751042","display_name":"Xinyi Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118516","display_name":"Conceptual Mindworks (United States)","ror":"https://ror.org/020ezhp63","country_code":"US","type":"company","lineage":["https://openalex.org/I4210118516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xinyi Pan","raw_affiliation_strings":["Conceptual Computing,Cambridge,Massachusetts"],"affiliations":[{"raw_affiliation_string":"Conceptual Computing,Cambridge,Massachusetts","institution_ids":["https://openalex.org/I4210118516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130816785","display_name":"Haiwei Chai","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118516","display_name":"Conceptual Mindworks (United States)","ror":"https://ror.org/020ezhp63","country_code":"US","type":"company","lineage":["https://openalex.org/I4210118516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haiwei Chai","raw_affiliation_strings":["Conceptual Computing,Cambridge,Massachusetts"],"affiliations":[{"raw_affiliation_string":"Conceptual Computing,Cambridge,Massachusetts","institution_ids":["https://openalex.org/I4210118516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130738198","display_name":"Dong Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118516","display_name":"Conceptual Mindworks (United States)","ror":"https://ror.org/020ezhp63","country_code":"US","type":"company","lineage":["https://openalex.org/I4210118516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dong Liu","raw_affiliation_strings":["Conceptual Computing,Cambridge,Massachusetts"],"affiliations":[{"raw_affiliation_string":"Conceptual Computing,Cambridge,Massachusetts","institution_ids":["https://openalex.org/I4210118516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130760517","display_name":"Feng Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118516","display_name":"Conceptual Mindworks (United States)","ror":"https://ror.org/020ezhp63","country_code":"US","type":"company","lineage":["https://openalex.org/I4210118516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Feng Zhu","raw_affiliation_strings":["Conceptual Computing,Cambridge,Massachusetts"],"affiliations":[{"raw_affiliation_string":"Conceptual Computing,Cambridge,Massachusetts","institution_ids":["https://openalex.org/I4210118516"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5130750341","display_name":"Xiaoyong Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118516","display_name":"Conceptual Mindworks (United States)","ror":"https://ror.org/020ezhp63","country_code":"US","type":"company","lineage":["https://openalex.org/I4210118516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaoyong Pan","raw_affiliation_strings":["Conceptual Computing,Cambridge,Massachusetts"],"affiliations":[{"raw_affiliation_string":"Conceptual Computing,Cambridge,Massachusetts","institution_ids":["https://openalex.org/I4210118516"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5122119928"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.88574897,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.15160000324249268,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.15160000324249268,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12032","display_name":"Multisensory perception and integration","score":0.1492999941110611,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.13570000231266022,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5023000240325928},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.41290000081062317},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.2939000129699707},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.25859999656677246}],"concepts":[{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.5103999972343445},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5023000240325928},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.41290000081062317},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.4043999910354614},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.39419999718666077},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.3314000070095062},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2955000102519989},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2946999967098236},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2939000129699707},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.25859999656677246}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icce67443.2026.11449775","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icce67443.2026.11449775","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Conference on Consumer Electronics (ICCE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/5","display_name":"Gender equality","score":0.7009300589561462}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W2020997493","https://openalex.org/W2111460811","https://openalex.org/W2463323901","https://openalex.org/W3209059054","https://openalex.org/W4381786045","https://openalex.org/W7133219565"],"related_works":[],"abstract_inverted_index":{"Computer":[0],"audition":[1],"systems":[2],"based":[3],"on":[4,18,82],"neural":[5,123],"processing":[6,34],"provide":[7],"deep":[8],"perceptual":[9,33],"understanding":[10],"of":[11],"digital":[12],"audio":[13,37,50],"signals":[14],"but":[15],"often":[16],"rely":[17],"extensive":[19],"manual":[20],"annotation.":[21],"In":[22],"this":[23,99],"paper,":[24],"we":[25],"propose":[26],"an":[27],"unsupervised":[28,100],"framework":[29],"to":[30,47,63],"imitate":[31],"human":[32],"for":[35],"high-resolution":[36,85,108],"quality":[38],"assessment.":[39],"We":[40],"employ":[41],"a":[42],"data":[43],"format":[44],"conversion":[45],"method":[46],"quantize":[48],"continuous":[49],"waveforms":[51],"into":[52],"discrete":[53],"token":[54],"sequences.":[55],"A":[56],"Large":[57],"Language":[58],"Model":[59],"is":[60,80],"then":[61],"utilized":[62],"model":[64],"these":[65],"sequences":[66],"via":[67],"next-token":[68],"prediction,":[69],"capturing":[70],"complex":[71],"temporal":[72],"dependencies":[73],"without":[74],"labeled":[75],"data.":[76],"Higher":[77],"prediction":[78,93],"accuracy":[79],"observed":[81],"truly":[83],"recorded":[84],"content,":[86],"while":[87],"artificially":[88],"up-sampled":[89],"content":[90],"induces":[91],"significant":[92],"drops.":[94],"Experimental":[95],"results":[96,118],"demonstrate":[97],"that":[98],"approach":[101],"effectively":[102],"distinguishes":[103],"between":[104],"true":[105],"and":[106],"synthesized":[107],"audio.":[109],"Manual":[110],"verification":[111],"result":[112],"shows":[113],"strong":[114],"agreement":[115],"with":[116],"the":[117,121],"provided":[119],"by":[120],"proposed":[122],"model.":[124]},"counts_by_year":[],"updated_date":"2026-03-29T06:01:01.467347","created_date":"2026-03-28T00:00:00"}
