{"id":"https://openalex.org/W4409399598","doi":"https://doi.org/10.1587/transinf.2024edl8085","title":"TEFFDConv: An Improved Approach to Enhance Temporal Localization in Sound Event Detection","display_name":"TEFFDConv: An Improved Approach to Enhance Temporal Localization in Sound Event Detection","publication_year":2025,"publication_date":"2025-04-13","ids":{"openalex":"https://openalex.org/W4409399598","doi":"https://doi.org/10.1587/transinf.2024edl8085"},"language":"en","primary_location":{"id":"doi:10.1587/transinf.2024edl8085","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2024edl8085","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/advpub/0/advpub_2024EDL8085/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.jstage.jst.go.jp/article/transinf/advpub/0/advpub_2024EDL8085/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015281297","display_name":"Xichang Cai","orcid":"https://orcid.org/0000-0003-1333-8812"},"institutions":[{"id":"https://openalex.org/I1456306","display_name":"North China University of Technology","ror":"https://ror.org/01nky7652","country_code":"CN","type":"education","lineage":["https://openalex.org/I1456306"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xichang CAI","raw_affiliation_strings":["Department of Electronic and Communication Engineering, North China University of Technology","North China University of Technology, Department of Electronic and Communication Engineering"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Communication Engineering, North China University of Technology","institution_ids":["https://openalex.org/I1456306"]},{"raw_affiliation_string":"North China University of Technology, Department of Electronic and Communication Engineering","institution_ids":["https://openalex.org/I1456306"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068761281","display_name":"Junfan Chen","orcid":"https://orcid.org/0009-0004-2898-482X"},"institutions":[{"id":"https://openalex.org/I1456306","display_name":"North China University of Technology","ror":"https://ror.org/01nky7652","country_code":"CN","type":"education","lineage":["https://openalex.org/I1456306"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingxuan CHEN","raw_affiliation_strings":["Department of Electronic and Communication Engineering, North China University of Technology","North China University of Technology, Department of Electronic and Communication Engineering"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Communication Engineering, North China University of Technology","institution_ids":["https://openalex.org/I1456306"]},{"raw_affiliation_string":"North China University of Technology, Department of Electronic and Communication Engineering","institution_ids":["https://openalex.org/I1456306"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100383203","display_name":"Ziyi Liu","orcid":"https://orcid.org/0000-0002-2407-9599"},"institutions":[{"id":"https://openalex.org/I1456306","display_name":"North China University of Technology","ror":"https://ror.org/01nky7652","country_code":"CN","type":"education","lineage":["https://openalex.org/I1456306"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziyi LIU","raw_affiliation_strings":["Department of Electronic and Communication Engineering, North China University of Technology","North China University of Technology, Department of Electronic and Communication Engineering"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Communication Engineering, North China University of Technology","institution_ids":["https://openalex.org/I1456306"]},{"raw_affiliation_string":"North China University of Technology, Department of Electronic and Communication Engineering","institution_ids":["https://openalex.org/I1456306"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007631768","display_name":"Menglong Wu","orcid":"https://orcid.org/0000-0002-5438-9256"},"institutions":[{"id":"https://openalex.org/I1456306","display_name":"North China University of Technology","ror":"https://ror.org/01nky7652","country_code":"CN","type":"education","lineage":["https://openalex.org/I1456306"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Menglong WU","raw_affiliation_strings":["Department of Electronic and Communication Engineering, North China University of Technology","North China University of Technology, Department of Electronic and Communication Engineering"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Communication Engineering, North China University of Technology","institution_ids":["https://openalex.org/I1456306"]},{"raw_affiliation_string":"North China University of Technology, Department of Electronic and Communication Engineering","institution_ids":["https://openalex.org/I1456306"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032440097","display_name":"Hongyang Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"HongYang GUO","raw_affiliation_strings":["Beijing TimeTuring Technology Company"],"affiliations":[{"raw_affiliation_string":"Beijing TimeTuring Technology Company","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015760394","display_name":"Xinglong Sun","orcid":"https://orcid.org/0000-0003-4782-4966"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xuejing SUN","raw_affiliation_strings":["Beijing TimeTuring Technology Company"],"affiliations":[{"raw_affiliation_string":"Beijing TimeTuring Technology Company","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5015281297"],"corresponding_institution_ids":["https://openalex.org/I1456306"],"apc_list":null,"apc_paid":null,"fwci":2.9449,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.89746502,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"E108.D","issue":"10","first_page":"1250","last_page":"1254"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9742000102996826,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9702000021934509,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8687612414360046},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6438805460929871},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.48976993560791016},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3651106357574463},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3650498390197754},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.3447236716747284},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.20996597409248352}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8687612414360046},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6438805460929871},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.48976993560791016},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3651106357574463},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3650498390197754},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3447236716747284},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.20996597409248352},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transinf.2024edl8085","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2024edl8085","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/advpub/0/advpub_2024EDL8085/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1587/transinf.2024edl8085","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2024edl8085","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/advpub/0/advpub_2024EDL8085/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409399598.pdf","grobid_xml":"https://content.openalex.org/works/W4409399598.grobid-xml"},"referenced_works_count":19,"referenced_works":["https://openalex.org/W2511089602","https://openalex.org/W2591013610","https://openalex.org/W2592691248","https://openalex.org/W2936774411","https://openalex.org/W2972922917","https://openalex.org/W2979507862","https://openalex.org/W3006275583","https://openalex.org/W3133954504","https://openalex.org/W3162176995","https://openalex.org/W3203468141","https://openalex.org/W4221149441","https://openalex.org/W4224920041","https://openalex.org/W4225331914","https://openalex.org/W4321594243","https://openalex.org/W4390832422","https://openalex.org/W4402979321","https://openalex.org/W6743731764","https://openalex.org/W6745136726","https://openalex.org/W6794880463"],"related_works":["https://openalex.org/W2909726438","https://openalex.org/W2067046791","https://openalex.org/W2909888262","https://openalex.org/W2025747832","https://openalex.org/W3020957235","https://openalex.org/W2056769785","https://openalex.org/W611303608","https://openalex.org/W4313595395","https://openalex.org/W2312783472","https://openalex.org/W2909748163"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"convolutional":[3,23],"recurrent":[4,28],"neural":[5,24,29],"networks":[6,25,30],"(CRNNs)":[7],"have":[8],"achieved":[9],"notable":[10,106],"success":[11],"in":[12,38,43,131,141],"sound":[13,84],"event":[14,142],"detection":[15],"(SED)":[16],"tasks":[17],"by":[18],"leveraging":[19],"the":[20,39,75,79,87,113,124,138],"strengths":[21],"of":[22,127],"(CNNs)":[26],"and":[27,70,100,102],"(RNNs).":[31],"However,":[32],"existing":[33],"models":[34],"still":[35],"face":[36],"limitations":[37],"temporal":[40,45,69,133],"dimension,":[41],"resulting":[42],"suboptimal":[44],"localization":[46],"accuracy":[47],"for":[48],"SED.":[49],"To":[50],"address":[51],"this":[52],"issue,":[53],"we":[54],"designed":[55],"a":[56,105],"model":[57,66,96],"called":[58],"Temporal":[59],"Enhanced":[60],"Full-Frequency":[61],"Dynamic":[62],"Convolution":[63],"(TEFFDConv).":[64],"This":[65],"incorporates":[67],"both":[68],"frequency":[71],"attention":[72],"mechanisms":[73],"with":[74],"full-dynamic":[76],"convolution,":[77],"enhancing":[78,132],"model's":[80],"ability":[81],"to":[82,109],"localize":[83],"events":[85],"at":[86],"frame":[88],"level.":[89],"Experimental":[90],"results":[91,122],"demonstrate":[92],"that":[93],"our":[94,128],"proposed":[95,129],"significantly":[97],"improved":[98],"PSDS1":[99],"CB-F1":[101],"IB-F1,":[103],"marking":[104],"advancement":[107],"compared":[108],"similar":[110],"methods.":[111,120],"Additionally,":[112],"PSDS2":[114],"also":[115,136],"showed":[116],"improvements":[117],"over":[118],"most":[119],"These":[121],"show":[123],"superior":[125],"performance":[126,140],"method":[130],"localization,":[134],"while":[135],"demonstrating":[137],"better":[139],"classification.":[143]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2026-04-01T17:29:45.350535","created_date":"2025-10-10T00:00:00"}
