{"id":"https://openalex.org/W3158464566","doi":"https://doi.org/10.1109/waspaa52581.2021.9632668","title":"Point Cloud Audio Processing","display_name":"Point Cloud Audio Processing","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3158464566","doi":"https://doi.org/10.1109/waspaa52581.2021.9632668","mag":"3158464566"},"language":"en","primary_location":{"id":"doi:10.1109/waspaa52581.2021.9632668","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa52581.2021.9632668","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2105.02469","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042472021","display_name":"Krishna Subramani","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Krishna Subramani","raw_affiliation_strings":["University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038903729","display_name":"Paris Smaragdis","orcid":null},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]},{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paris Smaragdis","raw_affiliation_strings":["Adobe Research","University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]},{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5042472021"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04100396,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"31","last_page":"35"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9915000200271606,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7026804685592651},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6150736212730408},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.5921183228492737},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.520685076713562},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.4620055556297302},{"id":"https://openalex.org/keywords/audio-signal-processing","display_name":"Audio signal processing","score":0.44451627135276794},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.41504448652267456},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.41422832012176514},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39260584115982056},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.34022825956344604},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.2445710301399231},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19349539279937744},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.16337177157402039}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7026804685592651},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6150736212730408},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.5921183228492737},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.520685076713562},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.4620055556297302},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.44451627135276794},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.41504448652267456},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.41422832012176514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39260584115982056},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34022825956344604},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.2445710301399231},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19349539279937744},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.16337177157402039},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/waspaa52581.2021.9632668","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa52581.2021.9632668","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2105.02469","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2105.02469","pdf_url":"https://arxiv.org/pdf/2105.02469","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3158464566","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/2105.02469.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2105.02469","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2105.02469","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2105.02469","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2105.02469","pdf_url":"https://arxiv.org/pdf/2105.02469","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1904365287","https://openalex.org/W2052666245","https://openalex.org/W2519887557","https://openalex.org/W2624503621","https://openalex.org/W2626778328","https://openalex.org/W2890848214","https://openalex.org/W2898360221","https://openalex.org/W2902302021","https://openalex.org/W2950642167","https://openalex.org/W2952433032","https://openalex.org/W2953273646","https://openalex.org/W2965960151","https://openalex.org/W2979750740","https://openalex.org/W3034442691","https://openalex.org/W6631190155","https://openalex.org/W6640036494","https://openalex.org/W6726873649","https://openalex.org/W6739778489","https://openalex.org/W6739901393","https://openalex.org/W6747904511","https://openalex.org/W6755477022","https://openalex.org/W6766159569","https://openalex.org/W6779459325"],"related_works":["https://openalex.org/W3116892833","https://openalex.org/W3160191260","https://openalex.org/W3177013509","https://openalex.org/W1575005467","https://openalex.org/W1858125052","https://openalex.org/W2771726741","https://openalex.org/W753830768","https://openalex.org/W2227972867","https://openalex.org/W2963452667","https://openalex.org/W1965720553","https://openalex.org/W1590352240","https://openalex.org/W1521144119","https://openalex.org/W3170094039","https://openalex.org/W2962981281","https://openalex.org/W2948211236","https://openalex.org/W3090288500","https://openalex.org/W3015635148","https://openalex.org/W2324934107","https://openalex.org/W2774097455","https://openalex.org/W3187219273"],"abstract_inverted_index":{"Most":[0],"audio":[1,39,59,77,102],"processing":[2,101],"pipelines":[3],"involve":[4],"transformations":[5],"that":[6,70,123,144],"act":[7],"on":[8,58],"fixed-dimensional":[9],"input":[10,33,86,158],"representations":[11],"of":[12,55,84,100,110,130],"audio.":[13],"For":[14],"example,":[15],"when":[16],"using":[17],"the":[18,24,32,53,71,76,82,85,89,128,138,157],"Short":[19],"Time":[20],"Fourier":[21],"Transform":[22],"(STFT)":[23],"DFT":[25,135],"size":[26,136],"specifies":[27],"a":[28,36,97,108,164],"fixed":[29],"dimension":[30],"for":[31],"representation.":[34],"As":[35],"consequence,":[37],"most":[38],"machine":[40,120],"learning":[41,121],"models":[42,57,122],"are":[43],"designed":[44],"to":[45,81,127,154,163],"process":[46],"fixed-size":[47],"vector":[48],"inputs":[49],"which":[50],"often":[51],"prohibits":[52],"repurposing":[54],"learned":[56],"with":[60,160],"different":[61],"sampling":[62,90,139],"rates":[63],"or":[64,88,137],"alternative":[65],"representations.":[66],"We":[67],"note,":[68],"however,":[69],"intrinsic":[72],"spectral":[73],"information":[74],"in":[75,112,148],"signal":[78],"is":[79],"invariant":[80],"choice":[83,129],"representation":[87,131,159],"rate.":[91,140],"Motivated":[92],"by":[93,104],"this,":[94],"we":[95,116,142],"introduce":[96],"novel":[98],"way":[99],"signals":[103],"treating":[105],"them":[106],"as":[107,134],"collection":[109],"points":[111],"feature":[113],"space,":[114],"and":[115,151],"use":[117],"point":[118],"cloud":[119],"give":[124],"us":[125,153],"invariance":[126],"parameters,":[132],"such":[133],"Additionally,":[141],"observe":[143],"these":[145],"methods":[146],"result":[147],"smaller":[149],"models,":[150],"allow":[152],"significantly":[155],"subsample":[156],"minimal":[161],"effects":[162],"trained":[165],"model":[166],"performance.":[167]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
