{"id":"https://openalex.org/W4394896988","doi":"https://doi.org/10.1109/tetci.2024.3386619","title":"From Discrete Representation to Continuous Modeling: A Novel Audio-Visual Saliency Prediction Model With Implicit Neural Representations","display_name":"From Discrete Representation to Continuous Modeling: A Novel Audio-Visual Saliency Prediction Model With Implicit Neural Representations","publication_year":2024,"publication_date":"2024-04-17","ids":{"openalex":"https://openalex.org/W4394896988","doi":"https://doi.org/10.1109/tetci.2024.3386619"},"language":"en","primary_location":{"id":"doi:10.1109/tetci.2024.3386619","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2024.3386619","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066581712","display_name":"Dandan Zhu","orcid":"https://orcid.org/0000-0001-6436-7088"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Dandan Zhu","raw_affiliation_strings":["Institute of AI Education, Shanghai East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of AI Education, Shanghai East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032888856","display_name":"Kaiwei Zhang","orcid":"https://orcid.org/0000-0002-1620-736X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaiwei Zhang","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101790399","display_name":"Kun Zhu","orcid":"https://orcid.org/0000-0002-5773-5089"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Zhu","raw_affiliation_strings":["Key Laboratory of Embedded System and Service Computing, Ministry of Education, Shanghai, China","National (Province-Ministry Joint) Collaborative Innovation Center for Financial Network Security, Tongji University, Shanghai, China","Department of Computer Science and Technology, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Embedded System and Service Computing, Ministry of Education, Shanghai, China","institution_ids":["https://openalex.org/I1327237609"]},{"raw_affiliation_string":"National (Province-Ministry Joint) Collaborative Innovation Center for Financial Network Security, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109706271","display_name":"Nana Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nana Zhang","raw_affiliation_strings":["School of Computer Science and Technology, Donghua University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069969191","display_name":"Weiping Ding","orcid":"https://orcid.org/0000-0002-3180-7347"},"institutions":[{"id":"https://openalex.org/I199305430","display_name":"Nantong University","ror":"https://ror.org/02afcvw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I199305430"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiping Ding","raw_affiliation_strings":["School of Computer and Science and Technology, Nantong University, Jiangsu, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Science and Technology, Nantong University, Jiangsu, China","institution_ids":["https://openalex.org/I199305430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064168853","display_name":"Guangtao Zhai","orcid":"https://orcid.org/0000-0001-8165-9322"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangtao Zhai","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019708391","display_name":"Xiaokang Yang","orcid":"https://orcid.org/0000-0003-4029-3322"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaokang Yang","raw_affiliation_strings":["MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5066581712"],"corresponding_institution_ids":["https://openalex.org/I66867065"],"apc_list":null,"apc_paid":null,"fwci":1.9168,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.84541233,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"8","issue":"6","first_page":"4059","last_page":"4074"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12496","display_name":"Color perception and design","score":0.9509999752044678,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12496","display_name":"Color perception and design","score":0.9509999752044678,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12032","display_name":"Multisensory perception and integration","score":0.9445000290870667,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/audio-visual","display_name":"Audio visual","score":0.8141701221466064},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.7371151447296143},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6419041156768799},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49525657296180725},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4475102722644806},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4143926203250885},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3972170948982239},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3583357334136963},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.10315263271331787}],"concepts":[{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.8141701221466064},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.7371151447296143},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6419041156768799},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49525657296180725},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4475102722644806},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4143926203250885},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3972170948982239},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3583357334136963},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.10315263271331787},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tetci.2024.3386619","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2024.3386619","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4000000059604645,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G2100497217","display_name":null,"funder_award_id":"62377011","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2593208977","display_name":null,"funder_award_id":"62302337","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3711735600","display_name":null,"funder_award_id":"61976120","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4679026377","display_name":null,"funder_award_id":"BK20191445","funder_id":"https://openalex.org/F4320322769","funder_display_name":"Natural Science Foundation of Jiangsu Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322769","display_name":"Natural Science Foundation of Jiangsu Province","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":84,"referenced_works":["https://openalex.org/W1152443276","https://openalex.org/W2015394094","https://openalex.org/W2038121453","https://openalex.org/W2056135328","https://openalex.org/W2091008902","https://openalex.org/W2097926315","https://openalex.org/W2099329509","https://openalex.org/W2112902774","https://openalex.org/W2119577735","https://openalex.org/W2146290679","https://openalex.org/W2155479901","https://openalex.org/W2212216676","https://openalex.org/W2288514685","https://openalex.org/W2313180542","https://openalex.org/W2498738402","https://openalex.org/W2517304349","https://openalex.org/W2529272619","https://openalex.org/W2533370895","https://openalex.org/W2558906385","https://openalex.org/W2585592883","https://openalex.org/W2612135493","https://openalex.org/W2740797387","https://openalex.org/W2757028014","https://openalex.org/W2799077596","https://openalex.org/W2799498328","https://openalex.org/W2803610340","https://openalex.org/W2804743778","https://openalex.org/W2955060956","https://openalex.org/W2962965915","https://openalex.org/W2963581854","https://openalex.org/W2963985934","https://openalex.org/W2964114039","https://openalex.org/W2969741484","https://openalex.org/W2971688562","https://openalex.org/W2986131415","https://openalex.org/W2997304642","https://openalex.org/W2999458807","https://openalex.org/W3000351820","https://openalex.org/W3027773793","https://openalex.org/W3034287518","https://openalex.org/W3034873438","https://openalex.org/W3082657571","https://openalex.org/W3098092829","https://openalex.org/W3099561715","https://openalex.org/W3101840568","https://openalex.org/W3138095408","https://openalex.org/W3170655219","https://openalex.org/W3171371659","https://openalex.org/W3173531806","https://openalex.org/W3174865552","https://openalex.org/W3176679855","https://openalex.org/W3180059462","https://openalex.org/W3193319282","https://openalex.org/W3195161059","https://openalex.org/W3195588784","https://openalex.org/W3195875706","https://openalex.org/W4200150166","https://openalex.org/W4226157755","https://openalex.org/W4226403574","https://openalex.org/W4295936340","https://openalex.org/W4300078741","https://openalex.org/W4312431055","https://openalex.org/W4312796583","https://openalex.org/W4313165271","https://openalex.org/W4313350201","https://openalex.org/W4319998010","https://openalex.org/W4327662052","https://openalex.org/W4367032246","https://openalex.org/W4377971262","https://openalex.org/W4379380529","https://openalex.org/W4385686754","https://openalex.org/W4386076558","https://openalex.org/W6637373629","https://openalex.org/W6698589804","https://openalex.org/W6732940373","https://openalex.org/W6763249567","https://openalex.org/W6763480078","https://openalex.org/W6779753539","https://openalex.org/W6780179280","https://openalex.org/W6780879210","https://openalex.org/W6791346067","https://openalex.org/W6792571853","https://openalex.org/W6803493554","https://openalex.org/W6810226158"],"related_works":["https://openalex.org/W2271369634","https://openalex.org/W3147472394","https://openalex.org/W2047100085","https://openalex.org/W2350550760","https://openalex.org/W578794879","https://openalex.org/W2625296515","https://openalex.org/W3137890128","https://openalex.org/W1984634519","https://openalex.org/W4245955731","https://openalex.org/W2393726419"],"abstract_inverted_index":{"In":[0],"the":[1,16,22,26,102,158],"era":[2],"of":[3,18,37,80],"deep":[4],"learning,":[5],"audio-visual":[6,68,153,191],"saliency":[7,69,104,159,192],"prediction":[8,160],"is":[9,85],"still":[10],"in":[11,25,157,190],"its":[12],"infancy":[13],"due":[14],"to":[15,48,86,101],"complexity":[17],"video":[19,52,112,125],"signals":[20],"and":[21,40,54,120,143,167,171,187],"continuous":[23,140],"correlation":[24],"temporal":[27,141],"dimension.":[28],"Most":[29],"existing":[30],"approaches":[31],"treat":[32],"videos":[33,116],"as":[34,51],"3D":[35],"grids":[36],"RGB":[38],"values":[39],"model":[41,71,84,108,183],"them":[42],"using":[43],"discrete":[44],"neural":[45,75,95,131],"networks,":[46],"leading":[47],"issues":[49],"such":[50],"content-agnostic":[53],"sub-optimal":[55],"feature":[56,122,145,154],"representation":[57,146],"ability.":[58],"To":[59],"address":[60],"these":[61],"challenges,":[62],"we":[63,149],"propose":[64],"a":[65,93,129,151],"novel":[66],"dynamic-aware":[67],"(DAVS)":[70],"based":[72],"on":[73,177],"implicit":[74],"representations":[76],"(INRs).":[77],"The":[78],"core":[79],"our":[81,107,180],"proposed":[82,181],"DAVS":[83,182],"build":[87],"an":[88,110],"effective":[89],"mapping":[90],"by":[91],"exploiting":[92],"parametric":[94,130,152],"network":[96],"that":[97,114],"maps":[98],"space-time":[99],"coordinates":[100],"corresponding":[103],"values.":[105],"Specifically,":[106],"incorporates":[109],"INR-based":[111],"generator":[113,134],"decomposes":[115],"into":[117],"image,":[118],"motion,":[119],"audio":[121,172],"vectors,":[123],"learning":[124],"content-adaptive":[126],"features":[127],"via":[128],"network.":[132],"This":[133],"efficiently":[135],"encodes":[136],"videos,":[137],"naturally":[138],"models":[139],"dynamics,":[142],"enhances":[144],"capability.":[147],"Furthermore,":[148],"introduce":[150],"fusion":[155],"strategy":[156],"procedure,":[161],"enabling":[162],"intrinsic":[163],"interactions":[164],"between":[165],"modalities":[166],"adaptively":[168],"integrating":[169],"visual":[170],"cues.":[173],"Through":[174],"extensive":[175],"experiments":[176],"benchmark":[178],"datasets,":[179],"demonstrates":[184],"promising":[185],"performance":[186],"intriguing":[188],"properties":[189],"prediction.":[193]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
