{"id":"https://openalex.org/W4386977577","doi":"https://doi.org/10.1145/3581783.3611853","title":"TMac: Temporal Multi-Modal Graph Learning for Acoustic Event Classification","display_name":"TMac: Temporal Multi-Modal Graph Learning for Acoustic Event Classification","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4386977577","doi":"https://doi.org/10.1145/3581783.3611853"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3611853","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3611853","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2309.11845","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100457574","display_name":"Meng Liu","orcid":"https://orcid.org/0000-0003-3900-4204"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Meng Liu","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009525613","display_name":"Ke Liang","orcid":"https://orcid.org/0000-0002-4837-455X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Liang","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031767346","display_name":"Dayu Hu","orcid":"https://orcid.org/0000-0002-9369-7390"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dayu Hu","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100647391","display_name":"Hao Yu","orcid":"https://orcid.org/0000-0001-9044-4841"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Yu","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100320103","display_name":"Yue Liu","orcid":"https://orcid.org/0000-0002-9894-0062"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Liu","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017200032","display_name":"Lingyuan Meng","orcid":"https://orcid.org/0000-0002-2489-573X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lingyuan Meng","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085607536","display_name":"Wenxuan Tu","orcid":"https://orcid.org/0000-0002-1353-2968"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenxuan Tu","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032131582","display_name":"Sihang Zhou","orcid":"https://orcid.org/0000-0003-1491-4594"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sihang Zhou","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101727888","display_name":"Xinwang Liu","orcid":"https://orcid.org/0000-0001-9066-1475"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinwang Liu","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5100457574"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":5.6902,"has_fulltext":true,"cited_by_count":29,"citation_normalized_percentile":{"value":0.97118298,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3365","last_page":"3374"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7918872237205505},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.7450648546218872},{"id":"https://openalex.org/keywords/timestamp","display_name":"Timestamp","score":0.6276869177818298},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.6029854416847229},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.5308260321617126},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46500903367996216},{"id":"https://openalex.org/keywords/temporal-database","display_name":"Temporal database","score":0.4175224304199219},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3466529846191406},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34005576372146606},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3334069848060608},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.21958860754966736},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.15468651056289673}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7918872237205505},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.7450648546218872},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.6276869177818298},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.6029854416847229},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.5308260321617126},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46500903367996216},{"id":"https://openalex.org/C77277458","wikidata":"https://www.wikidata.org/wiki/Q1969246","display_name":"Temporal database","level":2,"score":0.4175224304199219},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3466529846191406},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34005576372146606},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3334069848060608},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.21958860754966736},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.15468651056289673},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3581783.3611853","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3611853","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2309.11845","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.11845","pdf_url":"https://arxiv.org/pdf/2309.11845","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2309.11845","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.11845","pdf_url":"https://arxiv.org/pdf/2309.11845","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2455478723","display_name":null,"funder_award_id":"62276271","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5664600557","display_name":null,"funder_award_id":"62325604, 62276271","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5680782816","display_name":null,"funder_award_id":"62325604, 62276271","funder_id":"https://openalex.org/F4320334062","funder_display_name":"National Natural Science Foundation of China-Liaoning Joint Fund"},{"id":"https://openalex.org/G5729763073","display_name":null,"funder_award_id":"62325604","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334062","display_name":"National Natural Science Foundation of China-Liaoning Joint Fund","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4386977577.pdf","grobid_xml":"https://content.openalex.org/works/W4386977577.grobid-xml"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W267352410","https://openalex.org/W1501987291","https://openalex.org/W2065529590","https://openalex.org/W2146456494","https://openalex.org/W2511428026","https://openalex.org/W2529337537","https://openalex.org/W2619697695","https://openalex.org/W2808908091","https://openalex.org/W2963115079","https://openalex.org/W2963155035","https://openalex.org/W2965683718","https://openalex.org/W2982108874","https://openalex.org/W2998116985","https://openalex.org/W3012562343","https://openalex.org/W3012664577","https://openalex.org/W3037309139","https://openalex.org/W3094550259","https://openalex.org/W3154155788","https://openalex.org/W3162391496","https://openalex.org/W3175300676","https://openalex.org/W3182741322","https://openalex.org/W3190580390","https://openalex.org/W3210131246","https://openalex.org/W4220779330","https://openalex.org/W4225300652","https://openalex.org/W4226219101","https://openalex.org/W4285414370","https://openalex.org/W4285483676","https://openalex.org/W4285483774","https://openalex.org/W4290927845","https://openalex.org/W4297841792","https://openalex.org/W4306317449","https://openalex.org/W4379599555","https://openalex.org/W4382318469","https://openalex.org/W4382468415","https://openalex.org/W4385571579","https://openalex.org/W6600175564","https://openalex.org/W6600512042","https://openalex.org/W6601013545","https://openalex.org/W6603860191","https://openalex.org/W6629267907","https://openalex.org/W6818331381","https://openalex.org/W6825417173","https://openalex.org/W6840200333"],"related_works":["https://openalex.org/W2060561905","https://openalex.org/W1417711376","https://openalex.org/W2579899204","https://openalex.org/W2574209248","https://openalex.org/W2884490506","https://openalex.org/W2483088531","https://openalex.org/W2294686723","https://openalex.org/W2601871130","https://openalex.org/W2950359320","https://openalex.org/W2112128729"],"abstract_inverted_index":{"Audiovisual":[0],"data":[1,28,42,61,163,166],"is":[2,29,62,84,221],"everywhere":[3],"in":[4,55,74,86,202,217],"this":[5,124,193],"digital":[6],"age,":[7],"which":[8,72,110],"raises":[9],"higher":[10],"requirements":[11],"for":[12,52,91,134,156],"the":[13,23,26,30,49,56,112,179,199],"deep":[14],"learning":[15,132,147],"models":[16,216],"developed":[17],"on":[18,189],"them.":[19],"To":[20],"well":[21],"handle":[22],"information":[24,51,83,144,201],"of":[25,114],"multi-modal":[27,64,87],"key":[31],"to":[32,66,120,210],"a":[33,75,128,153,176],"better":[34],"audiovisual":[35,41],"modal.":[36],"We":[37],"observe":[38],"that":[39,81],"these":[40],"naturally":[43],"have":[44],"temporal":[45,82,115,143,154,180],"attributes,":[46],"such":[47,60,142],"as":[48,175,187],"time":[50],"each":[53,101,157],"frame":[54],"video.":[57],"More":[58],"concretely,":[59],"inherently":[63],"according":[65],"both":[67,92],"audio":[68,162],"and":[69,94,105,117,164,178,204],"visual":[70],"cues,":[71],"proceed":[73],"strict":[76],"chronological":[77],"order.":[78],"It":[79],"indicates":[80],"important":[85],"acoustic":[88,158],"event":[89,136],"modeling":[90,141],"intra-":[93],"inter-modal.":[95,205],"However,":[96],"existing":[97],"methods":[98],"deal":[99],"with":[100],"modal":[102],"feature":[103],"independently":[104],"simply":[106],"fuse":[107],"them":[108],"together,":[109],"neglects":[111],"mining":[113],"relation":[116],"thus":[118],"leads":[119],"sub-optimal":[121],"performance.":[122,218],"With":[123],"motivation,":[125],"we":[126,151,195],"propose":[127],"Temporal":[129],"Multi-modal":[130],"graph":[131,146,155],"method":[133],"Acoustic":[135],"Classification,":[137],"called":[138],"TMac,":[139],"by":[140],"via":[145],"techniques.":[148],"In":[149,192],"particular,":[150],"construct":[152],"event,":[159],"dividing":[160],"its":[161],"video":[165],"into":[167],"multiple":[168],"segments.":[169],"Each":[170],"segment":[171],"can":[172,184,196],"be":[173,185],"considered":[174,186],"node,":[177],"relationships":[181],"between":[182],"nodes":[183],"timestamps":[188],"their":[190],"edges.":[191],"case,":[194],"smoothly":[197],"capture":[198],"dynamic":[200],"intra-modal":[203],"Several":[206],"experiments":[207],"are":[208],"conducted":[209],"demonstrate":[211],"TMac":[212],"outperforms":[213],"other":[214],"SOTA":[215],"Our":[219],"code":[220],"available":[222],"at":[223],"https://github.com/MGitHubL/TMac.":[224]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
