{"id":"https://openalex.org/W4414404734","doi":"https://doi.org/10.1109/tcsvt.2025.3612697","title":"Multimodal Local Global Interaction Networks for Automatic Depression Severity Estimation","display_name":"Multimodal Local Global Interaction Networks for Automatic Depression Severity Estimation","publication_year":2025,"publication_date":"2025-09-22","ids":{"openalex":"https://openalex.org/W4414404734","doi":"https://doi.org/10.1109/tcsvt.2025.3612697"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2025.3612697","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3612697","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094262973","display_name":"Mingyue Niu","orcid":"https://orcid.org/0009-0000-5133-7525"},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingyue Niu","raw_affiliation_strings":["School of Information Science and Engineering, Yanshan University, Qinhuangdao, Hebei, China","School of Information Science and Engineering, Yanshan University, Qinhuangdao, Hebei province, China"],"raw_orcid":"https://orcid.org/0009-0000-5133-7525","affiliations":[{"raw_affiliation_string":"School of Information Science and Engineering, Yanshan University, Qinhuangdao, Hebei, China","institution_ids":["https://openalex.org/I39333907"]},{"raw_affiliation_string":"School of Information Science and Engineering, Yanshan University, Qinhuangdao, Hebei province, China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026412163","display_name":"Zhuhong Shao","orcid":"https://orcid.org/0000-0002-4847-282X"},"institutions":[{"id":"https://openalex.org/I96852419","display_name":"Capital Normal University","ror":"https://ror.org/005edt527","country_code":"CN","type":"education","lineage":["https://openalex.org/I96852419"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuhong Shao","raw_affiliation_strings":["College of Information Engineering, Capital Normal University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Information Engineering, Capital Normal University, Beijing, China","institution_ids":["https://openalex.org/I96852419"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026346396","display_name":"Yongjun He","orcid":"https://orcid.org/0000-0002-5156-651X"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongjun He","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100744502","display_name":"Jianhua Tao","orcid":"https://orcid.org/0000-0002-0477-587X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhua Tao","raw_affiliation_strings":["Department of Automation, Tsinghua University, Beijing, China","Department of Automation, Tsinghua University, Bejing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Department of Automation, Tsinghua University, Bejing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043060302","display_name":"Bj\u00f6rn W. Schuller","orcid":"https://orcid.org/0000-0002-6478-8699"},"institutions":[{"id":"https://openalex.org/I179225836","display_name":"University of Augsburg","ror":"https://ror.org/03p14d497","country_code":"DE","type":"education","lineage":["https://openalex.org/I179225836"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Bj\u00f6rn W. Schuller","raw_affiliation_strings":["ZD.B Chair of Embedded Intelligence for Health Care and Wellbeing, University of Augsburg, Augsburg, Germany","ZD.B. Chair of Embedded Intelligence for Health Care and Wellbeing, University of Augsburg, Augsburg, Germany"],"raw_orcid":"https://orcid.org/0000-0002-6478-8699","affiliations":[{"raw_affiliation_string":"ZD.B Chair of Embedded Intelligence for Health Care and Wellbeing, University of Augsburg, Augsburg, Germany","institution_ids":["https://openalex.org/I179225836"]},{"raw_affiliation_string":"ZD.B. Chair of Embedded Intelligence for Health Care and Wellbeing, University of Augsburg, Augsburg, Germany","institution_ids":["https://openalex.org/I179225836"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7406,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.86668947,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"36","issue":"2","first_page":"2649","last_page":"2664"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.9682000279426575,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.9682000279426575,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.935699999332428,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9003000259399414,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perceptron","display_name":"Perceptron","score":0.569599986076355},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5669999718666077},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5410000085830688},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4571000039577484},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.4023999869823456},{"id":"https://openalex.org/keywords/interaction-network","display_name":"Interaction network","score":0.3644999861717224},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.3589000105857849},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3506999909877777},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.34940001368522644}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7038999795913696},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5773000121116638},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.569599986076355},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5669999718666077},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5410000085830688},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4999000132083893},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4571000039577484},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.4023999869823456},{"id":"https://openalex.org/C55105296","wikidata":"https://www.wikidata.org/wiki/Q841382","display_name":"Interaction network","level":3,"score":0.3644999861717224},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3589000105857849},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3506999909877777},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.34940001368522644},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3456999957561493},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C51432778","wikidata":"https://www.wikidata.org/wiki/Q1259145","display_name":"Independent component analysis","level":2,"score":0.32659998536109924},{"id":"https://openalex.org/C38764148","wikidata":"https://www.wikidata.org/wiki/Q17098245","display_name":"Interaction information","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C179717631","wikidata":"https://www.wikidata.org/wiki/Q2991667","display_name":"Multilayer perceptron","level":3,"score":0.3262999951839447},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.31450000405311584},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C2780806968","wikidata":"https://www.wikidata.org/wiki/Q6045196","display_name":"Interaction model","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2605000138282776},{"id":"https://openalex.org/C2987082051","wikidata":"https://www.wikidata.org/wiki/Q223642","display_name":"Human interaction","level":2,"score":0.2574000060558319},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3612697","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3612697","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1338786405","display_name":null,"funder_award_id":"62473111","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6039608666","display_name":null,"funder_award_id":"2023LGQN006","funder_id":"https://openalex.org/F4320329228","funder_display_name":"Science Research Foundation of Xijing University"},{"id":"https://openalex.org/G8276991870","display_name":null,"funder_award_id":"62576302","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329228","display_name":"Science Research Foundation of Xijing University","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":66,"referenced_works":["https://openalex.org/W1976066595","https://openalex.org/W1988088279","https://openalex.org/W2021678994","https://openalex.org/W2027192823","https://openalex.org/W2056403322","https://openalex.org/W2084242110","https://openalex.org/W2091936017","https://openalex.org/W2095540482","https://openalex.org/W2102505790","https://openalex.org/W2346454595","https://openalex.org/W2519531315","https://openalex.org/W2592018447","https://openalex.org/W2805409402","https://openalex.org/W2889847952","https://openalex.org/W2977251593","https://openalex.org/W2981677410","https://openalex.org/W3003850414","https://openalex.org/W3004404036","https://openalex.org/W3048093647","https://openalex.org/W3094259155","https://openalex.org/W3097777922","https://openalex.org/W3154272446","https://openalex.org/W3155665398","https://openalex.org/W3178321902","https://openalex.org/W3197466182","https://openalex.org/W3215165842","https://openalex.org/W4200262469","https://openalex.org/W4206144048","https://openalex.org/W4214493665","https://openalex.org/W4225308041","https://openalex.org/W4225324845","https://openalex.org/W4285132306","https://openalex.org/W4285188301","https://openalex.org/W4285307867","https://openalex.org/W4290098820","https://openalex.org/W4296437558","https://openalex.org/W4310333988","https://openalex.org/W4312950730","https://openalex.org/W4320009770","https://openalex.org/W4321353437","https://openalex.org/W4368232813","https://openalex.org/W4379382445","https://openalex.org/W4381785813","https://openalex.org/W4384519140","https://openalex.org/W4385823099","https://openalex.org/W4386374821","https://openalex.org/W4386424478","https://openalex.org/W4387010698","https://openalex.org/W4387245349","https://openalex.org/W4387247768","https://openalex.org/W4389195633","https://openalex.org/W4390166761","https://openalex.org/W4393241163","https://openalex.org/W4400062066","https://openalex.org/W4405642781","https://openalex.org/W4406753812","https://openalex.org/W4407693149","https://openalex.org/W4408345731","https://openalex.org/W4408352874","https://openalex.org/W4408356758","https://openalex.org/W4408609454","https://openalex.org/W4408708355","https://openalex.org/W4409262129","https://openalex.org/W4409346332","https://openalex.org/W4409917236","https://openalex.org/W7124131577"],"related_works":[],"abstract_inverted_index":{"Physiological":[0],"studies":[1],"have":[2,22],"shown":[3],"that":[4],"differences":[5],"between":[6,74,112],"depressed":[7],"and":[8,16,25,65,76,80,134,176,197,215],"healthy":[9],"individuals":[10],"are":[11,44],"manifested":[12],"in":[13,163],"the":[14,35,49,67,71,85,89,104,115,136,145,178,183,195,202,221],"audio":[15,29],"video":[17,31],"modalities.":[18],"Hence,":[19],"some":[20],"researchers":[21],"combined":[23],"local":[24,75],"global":[26,77],"information":[27],"from":[28,167],"or":[30,40,57],"modality":[32],"to":[33,47,69,108,130,139,172,181,200],"obtain":[34,182],"unimodal":[36],"representation.":[37],"Attention":[38],"mechanisms":[39,56],"Multi-Layer":[41],"Perceptrons":[42],"(MLPs)":[43],"then":[45],"used":[46],"complete":[48],"fusion":[50],"of":[51,87,125,185,223],"different":[52],"representations.":[53,113],"However,":[54],"attention":[55,179],"MLPs":[58],"is":[59],"essentially":[60],"a":[61,97,153,164,169],"linear":[62,106],"aggregation":[63],"manner,":[64],"lacks":[66],"ability":[68,138],"explore":[70],"element-wise":[72,110],"interaction":[73,111,146],"representations":[78],"within":[79],"across":[81],"modalities,":[82],"which":[83,102,128],"affects":[84],"accuracy":[86],"estimating":[88],"depression":[90,141,188,218],"severity.":[91,189],"To":[92],"this":[93,191],"end,":[94],"we":[95,151,193],"propose":[96,152],"Representation":[98],"Interaction":[99,206],"(RI)":[100],"module,":[101],"uses":[103],"mutual":[105,123],"adjustment":[107],"achieve":[109,131],"Thus,":[114],"RI":[116,196],"module":[117,159],"can":[118],"be":[119],"seen":[120],"as":[121],"an":[122,186],"observation":[124],"two":[126],"representations,":[127,150,175],"helps":[129],"complementary":[132],"advantages":[133],"improve":[135],"model\u2019s":[137],"characterize":[140],"cues.":[142],"Furthermore,":[143],"since":[144],"process":[147],"generates":[148],"multiple":[149,174],"Multi-representation":[154],"Prediction":[155],"(MP)":[156],"module.":[157],"This":[158],"implements":[160],"multi-representation":[161],"vectorization":[162],"hierarchical":[165],"manner":[166],"summarizing":[168],"single":[170],"representation":[171],"aggregating":[173],"adopts":[177],"mechanism":[180],"estimation":[184],"individual":[187],"In":[190],"way,":[192],"use":[194],"MP":[198],"modules":[199],"construct":[201],"Multimodal":[203],"Local":[204],"Global":[205],"(MLGI)":[207],"network.":[208],"The":[209],"experimental":[210],"performance":[211],"on":[212],"AVEC":[213,216],"2013":[214],"2014":[217],"datasets":[219],"demonstrates":[220],"effectiveness":[222],"our":[224],"method.":[225]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
