{"id":"https://openalex.org/W4285203769","doi":"https://doi.org/10.1109/taslp.2022.3171969","title":"An Efficient Algorithm for Segmenting Quasi-Periodic Digital Signals Into Pseudo Cycles: Application in Lossy Audio Compression","display_name":"An Efficient Algorithm for Segmenting Quasi-Periodic Digital Signals Into Pseudo Cycles: Application in Lossy Audio Compression","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4285203769","doi":"https://doi.org/10.1109/taslp.2022.3171969"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2022.3171969","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2022.3171969","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031029948","display_name":"Carlos Henrique Tarjano Santos","orcid":"https://orcid.org/0000-0003-3134-2778"},"institutions":[{"id":"https://openalex.org/I161127581","display_name":"Universidade Federal Fluminense","ror":"https://ror.org/02rjhbb08","country_code":"BR","type":"education","lineage":["https://openalex.org/I161127581"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Carlos Tarjano","raw_affiliation_strings":["Production Engineering Department, Universidade Federal Fluminense, Niteroi, RJ, Brazil"],"raw_orcid":"https://orcid.org/0000-0003-3134-2778","affiliations":[{"raw_affiliation_string":"Production Engineering Department, Universidade Federal Fluminense, Niteroi, RJ, Brazil","institution_ids":["https://openalex.org/I161127581"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071593480","display_name":"Valdecy Pereira","orcid":"https://orcid.org/0000-0003-0599-8888"},"institutions":[{"id":"https://openalex.org/I161127581","display_name":"Universidade Federal Fluminense","ror":"https://ror.org/02rjhbb08","country_code":"BR","type":"education","lineage":["https://openalex.org/I161127581"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Valdecy Pereira","raw_affiliation_strings":["Production Engineering Department, Universidade Federal Fluminense, Niteroi, RJ, Brazil"],"raw_orcid":"https://orcid.org/0000-0003-0599-8888","affiliations":[{"raw_affiliation_string":"Production Engineering Department, Universidade Federal Fluminense, Niteroi, RJ, Brazil","institution_ids":["https://openalex.org/I161127581"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5031029948"],"corresponding_institution_ids":["https://openalex.org/I161127581"],"apc_list":null,"apc_paid":null,"fwci":0.4464,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.57546698,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"30","issue":null,"first_page":"1694","last_page":"1703"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.7851974368095398},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7480913996696472},{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.6369465589523315},{"id":"https://openalex.org/keywords/sound-quality","display_name":"Sound quality","score":0.5696172118186951},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.5402931571006775},{"id":"https://openalex.org/keywords/lossless-compression","display_name":"Lossless compression","score":0.5266161561012268},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5206774473190308},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.48404544591903687},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.4834345579147339},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.4649352729320526},{"id":"https://openalex.org/keywords/dynamic-range-compression","display_name":"Dynamic range compression","score":0.43415576219558716},{"id":"https://openalex.org/keywords/digital-audio","display_name":"Digital audio","score":0.4329599142074585},{"id":"https://openalex.org/keywords/data-compression-ratio","display_name":"Data compression ratio","score":0.4146120548248291},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24930429458618164},{"id":"https://openalex.org/keywords/image-compression","display_name":"Image compression","score":0.18680346012115479},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.11454865336418152},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.0923563539981842}],"concepts":[{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.7851974368095398},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7480913996696472},{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.6369465589523315},{"id":"https://openalex.org/C167310288","wikidata":"https://www.wikidata.org/wiki/Q7564808","display_name":"Sound quality","level":2,"score":0.5696172118186951},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.5402931571006775},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.5266161561012268},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5206774473190308},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.48404544591903687},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.4834345579147339},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.4649352729320526},{"id":"https://openalex.org/C150178126","wikidata":"https://www.wikidata.org/wiki/Q18433212","display_name":"Dynamic range compression","level":2,"score":0.43415576219558716},{"id":"https://openalex.org/C87687168","wikidata":"https://www.wikidata.org/wiki/Q173114","display_name":"Digital audio","level":4,"score":0.4329599142074585},{"id":"https://openalex.org/C94835093","wikidata":"https://www.wikidata.org/wiki/Q3113333","display_name":"Data compression ratio","level":5,"score":0.4146120548248291},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24930429458618164},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.18680346012115479},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.11454865336418152},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.0923563539981842},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2022.3171969","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2022.3171969","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W186826960","https://openalex.org/W403203070","https://openalex.org/W1496883935","https://openalex.org/W1560857892","https://openalex.org/W1697514459","https://openalex.org/W1728888090","https://openalex.org/W1969995484","https://openalex.org/W1978316435","https://openalex.org/W1979932443","https://openalex.org/W2002213065","https://openalex.org/W2019092077","https://openalex.org/W2019858047","https://openalex.org/W2029733930","https://openalex.org/W2038649911","https://openalex.org/W2090284173","https://openalex.org/W2096270777","https://openalex.org/W2097772361","https://openalex.org/W2109153336","https://openalex.org/W2140020944","https://openalex.org/W2167274237","https://openalex.org/W2382313035","https://openalex.org/W2408292770","https://openalex.org/W2587083256","https://openalex.org/W2611458801","https://openalex.org/W2623662528","https://openalex.org/W2647078120","https://openalex.org/W2775561228","https://openalex.org/W2785228337","https://openalex.org/W2792068891","https://openalex.org/W2802402824","https://openalex.org/W2912372306","https://openalex.org/W2951974815","https://openalex.org/W2964255696","https://openalex.org/W2969570307","https://openalex.org/W2991122796","https://openalex.org/W2997091880","https://openalex.org/W3037038648","https://openalex.org/W3131509212","https://openalex.org/W3198576000","https://openalex.org/W4250499635","https://openalex.org/W4255018581","https://openalex.org/W6630442970","https://openalex.org/W6633584340","https://openalex.org/W6635459924","https://openalex.org/W6636106077","https://openalex.org/W6638142982","https://openalex.org/W6697214680","https://openalex.org/W6757202746","https://openalex.org/W6764707986","https://openalex.org/W6986431730"],"related_works":["https://openalex.org/W1590604789","https://openalex.org/W4312624015","https://openalex.org/W2155254568","https://openalex.org/W2898469868","https://openalex.org/W4236707033","https://openalex.org/W2361662430","https://openalex.org/W2793211626","https://openalex.org/W4225318512","https://openalex.org/W2514468213","https://openalex.org/W2064800047"],"abstract_inverted_index":{"Signal":[0],"segmentation":[1,123],"is":[2,103,125,139,172,227],"used":[3,78,118,167],"in":[4,79,88,168,180],"many":[5],"areas,":[6],"from":[7,61,113],"audio":[8,89,132,233],"processing":[9],"to":[10,23,36,130,163,174,230],"health":[11],"applications,":[12],"and":[13,28,69,93,145,158,171,184,200,209,235,241],"consists":[14],"of":[15,72,95,155,213,245],"dividing":[16],"a":[17,41,47,153,201,210],"signal":[18,50,239],"into":[19,51],"segments,":[20],"homogeneous":[21],"according":[22,35],"given":[24],"metrics.":[25],"Those":[26],"metrics,":[27],"even":[29],"the":[30,56,66,70,106,114,142,214,225],"methods":[31],"used,":[32],"vary":[33],"substantially":[34],"each":[37,73],"application.":[38],"We":[39,222],"propose":[40],"general,":[42],"lower-level":[43],"algorithm":[44,124,226],"that":[45,224],"divides":[46],"quasi-periodic":[48],"digital":[49,96,169],"its":[52],"fundamental":[53],"building":[54],"blocks,":[55],"pseudo":[57,74],"cycles.":[58],"Features":[59],"derived":[60],"this":[62],"segmentation,":[63],"such":[64],"as":[65],"temporal":[67],"envelope":[68,236],"length":[71],"cycle,":[75],"can":[76,206,217],"be":[77,207,218],"further":[80],"tasks,":[81],"like":[82],"sound":[83],"compression,":[84],"with":[85,111,141,238],"direct":[86],"applications":[87],"streaming":[90],"bandwidth":[91],"reduction":[92],"compression":[94,150,196,234],"musical":[97],"instruments":[98],"sample":[99],"libraries.":[100],"The":[101,122],"method":[102],"based":[104],"on":[105,152],"sliding":[107],"discrete":[108],"Fourier":[109],"transform,":[110],"assumptions":[112],"circular":[115],"time-shift":[116],"theory":[117],"for":[119],"performance":[120],"improvements.":[121],"tested":[126],"via":[127],"an":[128],"application":[129],"lossy":[131,232],"compression.":[133],"This":[134],"implementation,":[135],"dubbed":[136],"Harmonic":[137],"Compression,":[138],"compared":[140],"MP3,":[143],"AAC,":[144],"Opus":[146],"codecs":[147,179],"at":[148],"similar":[149,195],"rates,":[151],"set":[154],"8":[156,159],"voice":[157],"instrument":[160],"signals":[161],"chosen":[162],"represent":[164],"typical":[165],"samples":[166],"instruments,":[170],"shown":[173],"perform":[175],"better":[176],"than":[177],"those":[178],"objective":[181],"quality":[182],"metrics":[183],"simulated":[185],"subjective":[186],"listening":[187],"tests,":[188],"exhibiting":[189],"faster":[190],"decoding":[191],"speeds":[192],"while":[193],"achieving":[194],"rates.":[197],"A":[198],"website":[199],"GitHub":[202],"repository,":[203],"where":[204],"results":[205],"heard":[208],"C++":[211],"implementation":[212],"proposed":[215],"codec":[216],"obtained,":[219],"are":[220],"available.":[221],"find":[223],"immediately":[228],"applicable":[229],"domain-specific":[231],"extraction,":[237],"classification":[240],"wavetable":[242],"matching":[243],"examples":[244],"other":[246],"potential":[247],"uses.":[248]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
