{"id":"https://openalex.org/W4415594183","doi":"https://doi.org/10.1109/taffc.2025.3625612","title":"Modeling Multimodal Depression Diagnosis From the Perspective of Local Depressive Representation","display_name":"Modeling Multimodal Depression Diagnosis From the Perspective of Local Depressive Representation","publication_year":2025,"publication_date":"2025-10-27","ids":{"openalex":"https://openalex.org/W4415594183","doi":"https://doi.org/10.1109/taffc.2025.3625612"},"language":null,"primary_location":{"id":"doi:10.1109/taffc.2025.3625612","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taffc.2025.3625612","pdf_url":null,"source":{"id":"https://openalex.org/S104780363","display_name":"IEEE Transactions on Affective Computing","issn_l":"1949-3045","issn":["1949-3045","2371-9850"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Affective Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012713499","display_name":"Junjie Liang","orcid":"https://orcid.org/0000-0003-4582-2393"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Junjie Liang","raw_affiliation_strings":["College of Computer Science and Engineering, Northeastern University, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101986227","display_name":"Peng Cao","orcid":"https://orcid.org/0000-0002-7859-2769"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Cao","raw_affiliation_strings":["College of Computer Science and Engineering, Northeastern University, Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0002-7859-2769","affiliations":[{"raw_affiliation_string":"College of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080539155","display_name":"Chongxiao Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chongxiao Wang","raw_affiliation_strings":["College of Computer Science and Engineering, Northeastern University, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017211677","display_name":"Jinzhu Yang","orcid":"https://orcid.org/0000-0002-7754-1273"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinzhu Yang","raw_affiliation_strings":["College of Computer Science and Engineering, Northeastern University, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100455849","display_name":"Fei Wang","orcid":"https://orcid.org/0000-0002-5982-2303"},"institutions":[{"id":"https://openalex.org/I4210109791","display_name":"Nanjing Brain Hospital","ror":"https://ror.org/01wcx2305","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210109791"]},{"id":"https://openalex.org/I83519826","display_name":"Nanjing Medical University","ror":"https://ror.org/059gcgy73","country_code":"CN","type":"education","lineage":["https://openalex.org/I83519826"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Wang","raw_affiliation_strings":["Early Intervention Unit, Department of Psychiatry, Affiliated Nanjing Brain Hospital, Nanjing Medical University, Nanjing, China","Early Intervention Unit, Department of Psychiatry Affiliated Nanjing Brain Hospital, Nanjing Medical University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-5982-2303","affiliations":[{"raw_affiliation_string":"Early Intervention Unit, Department of Psychiatry, Affiliated Nanjing Brain Hospital, Nanjing Medical University, Nanjing, China","institution_ids":["https://openalex.org/I4210109791","https://openalex.org/I83519826"]},{"raw_affiliation_string":"Early Intervention Unit, Department of Psychiatry Affiliated Nanjing Brain Hospital, Nanjing Medical University, Nanjing, China","institution_ids":["https://openalex.org/I4210109791"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053745515","display_name":"Osmar R. Za\u0131\u0308ane","orcid":"https://orcid.org/0000-0002-0060-5988"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Osmar R. Zaiane","raw_affiliation_strings":["Department of Computing Science, University of Alberta, Edmonton, AB, Canada","department of Computing Science at the University of Alberta, Canada"],"raw_orcid":"https://orcid.org/0000-0002-0060-5988","affiliations":[{"raw_affiliation_string":"Department of Computing Science, University of Alberta, Edmonton, AB, Canada","institution_ids":["https://openalex.org/I154425047"]},{"raw_affiliation_string":"department of Computing Science at the University of Alberta, Canada","institution_ids":["https://openalex.org/I154425047"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5012713499"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.30494569,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"17","issue":"1","first_page":"497","last_page":"510"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.7712000012397766,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.7712000012397766,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13795","display_name":"Language, Communication, and Linguistic Studies","score":0.6592000126838684,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T14512","display_name":"Technology and Human Factors in Education and Health","score":0.6402000188827515,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.555899977684021},{"id":"https://openalex.org/keywords/affective-computing","display_name":"Affective computing","score":0.5544000267982483},{"id":"https://openalex.org/keywords/mood","display_name":"Mood","score":0.534600019454956},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.49720001220703125},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.48919999599456787},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.47780001163482666},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.45019999146461487},{"id":"https://openalex.org/keywords/major-depressive-disorder","display_name":"Major depressive disorder","score":0.41519999504089355},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.3758000135421753}],"concepts":[{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.555899977684021},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.5544000267982483},{"id":"https://openalex.org/C2780733359","wikidata":"https://www.wikidata.org/wiki/Q331769","display_name":"Mood","level":2,"score":0.534600019454956},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5166000127792358},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.49720001220703125},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.48919999599456787},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4832000136375427},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.47780001163482666},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.45509999990463257},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.45019999146461487},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.4478999972343445},{"id":"https://openalex.org/C2780051608","wikidata":"https://www.wikidata.org/wiki/Q42844","display_name":"Major depressive disorder","level":3,"score":0.41519999504089355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.400299996137619},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.3758000135421753},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.36570000648498535},{"id":"https://openalex.org/C2776867660","wikidata":"https://www.wikidata.org/wiki/Q1814941","display_name":"Depression (economics)","level":2,"score":0.36320000886917114},{"id":"https://openalex.org/C2776289891","wikidata":"https://www.wikidata.org/wiki/Q1931511","display_name":"Neglect","level":2,"score":0.34220001101493835},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C3019858935","wikidata":"https://www.wikidata.org/wiki/Q4340209","display_name":"Depressive symptoms","level":3,"score":0.3034000098705292},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.299699991941452},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.29499998688697815},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.2939999997615814},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.28600001335144043},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.2727000117301941},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.2651999890804291}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taffc.2025.3625612","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taffc.2025.3625612","pdf_url":null,"source":{"id":"https://openalex.org/S104780363","display_name":"IEEE Transactions on Affective Computing","issn_l":"1949-3045","issn":["1949-3045","2371-9850"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Affective Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2483983123","display_name":null,"funder_award_id":"62076059","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4746588107","display_name":null,"funder_award_id":"N25BJD005","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Depression":[0,69],"recognition":[1,71],"is":[2],"critical":[3],"for":[4,225],"early":[5],"detection":[6],"and":[7,36,50,100,142,151,186,192,203,218],"treatment.":[8],"Existing":[9],"works":[10],"focus":[11,219],"on":[12,172,189,220],"modeling":[13],"coarse-grained":[14],"multimodal":[15,60,134,147],"representation":[16],"to":[17,93,112,161,183],"estimate":[18],"the":[19,27,46,57,80,114,126,132,137,163,190,196],"depression":[20],"level.":[21],"However,":[22],"these":[23],"approaches":[24],"often":[25],"overlook":[26],"inherent":[28],"locality":[29],"of":[30,53,59,82,116,122,139],"depressive":[31,38,83,98,123,216,228],"representation,":[32],"resulting":[33],"in":[34,166],"weak":[35],"sparse":[37],"frames":[39],"being":[40],"overlooked.":[41],"In":[42],"addition,":[43],"they":[44],"neglect":[45],"inter":[47],"modal":[48],"correlations":[49],"intra-modal":[51,143],"patterns":[52],"mood":[54],"change,":[55],"limiting":[56],"learning":[58],"complementary":[61],"information.":[62],"Therefore,":[63],"we":[64,85,105,155],"present":[65],"a":[66,157,200],"Locality-Aware":[67],"Multimodal":[68],"(LAMD)":[70],"model.":[72],"Specifically,":[73],"LAMD":[74,177,212],"contains":[75],"three":[76],"innovations:":[77],"1)":[78],"Considering":[79],"sparsity":[81],"features,":[84],"propose":[86,156],"an":[87],"Adaptive":[88],"Temporal":[89],"Attention":[90],"(ATA)":[91],"module":[92],"adaptively":[94,214],"highlight":[95],"keyframes":[96,217],"with":[97,181],"features":[99,124],"suppress":[101],"irrelevant":[102],"frames.":[103],"Additionally,":[104],"introduce":[106],"Segment":[107],"Information":[108],"Sharing":[109],"(SIS)":[110],"strategy":[111],"overcome":[113],"limitation":[115],"inter-segment":[117],"independence,":[118],"enabling":[119],"global":[120],"awareness":[121],"within":[125],"whole":[127],"segment.":[128],"2)":[129],"We":[130],"revisit":[131],"audio-video":[133],"interaction":[135],"from":[136],"perspectives":[138],"inter-modal":[140,164],"correlation":[141],"smoothness,":[144],"introducing":[145],"frame-level":[146],"attention":[148,160],"consistency":[149],"constraints":[150],"smooth":[152],"constraints.":[153],"Furthermore,":[154],"local":[158],"cross":[159],"enhance":[162],"interactions":[165],"adjacent":[167],"time.":[168],"3)":[169],"Extensive":[170],"experiments":[171],"several":[173],"datasets":[174],"demonstrate":[175],"that":[176,211],"achieves":[178],"superior":[179],"performance,":[180],"up":[182],"7.21":[184],"RMSE":[185],"76.77%":[187],"F1-score":[188],"AVEC2014":[191],"NJAD":[193],"dataset,":[194],"outperforming":[195],"prior":[197],"art":[198],"by":[199],"notable":[201],"0.22%":[202],"1.88%":[204],"margin,":[205],"respectively.":[206],"Moreover,":[207],"visual":[208],"analysis":[209],"reveals":[210],"can":[213],"perceive":[215],"fine-grained":[221],"facial":[222],"regions":[223],"known":[224],"capturing":[226],"subtle":[227],"expressions.":[229]},"counts_by_year":[],"updated_date":"2026-03-03T06:13:14.889584","created_date":"2025-10-28T00:00:00"}
