{"id":"https://openalex.org/W4415524257","doi":"https://doi.org/10.1109/mlsp62443.2025.11204342","title":"GEMS: Group Emotion Profiling Through Multimodal Situational Understanding","display_name":"GEMS: Group Emotion Profiling Through Multimodal Situational Understanding","publication_year":2025,"publication_date":"2025-08-31","ids":{"openalex":"https://openalex.org/W4415524257","doi":"https://doi.org/10.1109/mlsp62443.2025.11204342"},"language":null,"primary_location":{"id":"doi:10.1109/mlsp62443.2025.11204342","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp62443.2025.11204342","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 35th International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021223733","display_name":"Aman Kataria","orcid":"https://orcid.org/0000-0001-5634-3465"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Anubhav Kataria","raw_affiliation_strings":["Kroop AI"],"affiliations":[{"raw_affiliation_string":"Kroop AI","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078144481","display_name":"Surbhi Madan","orcid":"https://orcid.org/0009-0000-3774-8117"},"institutions":[{"id":"https://openalex.org/I119241673","display_name":"Indian Institute of Technology Ropar","ror":"https://ror.org/02qkhhn56","country_code":"IN","type":"education","lineage":["https://openalex.org/I119241673"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Surbhi Madan","raw_affiliation_strings":["IIT Ropar"],"affiliations":[{"raw_affiliation_string":"IIT Ropar","institution_ids":["https://openalex.org/I119241673"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034501904","display_name":"Shreya Ghosh","orcid":"https://orcid.org/0000-0002-2639-8374"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Shreya Ghosh","raw_affiliation_strings":["Curtin University"],"affiliations":[{"raw_affiliation_string":"Curtin University","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030379402","display_name":"Tom Gedeon","orcid":"https://orcid.org/0000-0001-8356-4909"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Tom Gedeon","raw_affiliation_strings":["Curtin University"],"affiliations":[{"raw_affiliation_string":"Curtin University","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085376429","display_name":"Abhinav Dhall","orcid":"https://orcid.org/0000-0002-2230-1440"},"institutions":[{"id":"https://openalex.org/I2801239119","display_name":"Australian Regenerative Medicine Institute","ror":"https://ror.org/02qa5kg76","country_code":"AU","type":"facility","lineage":["https://openalex.org/I2801037857","https://openalex.org/I2801239119","https://openalex.org/I56590836"]},{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Abhinav Dhall","raw_affiliation_strings":["Monash University"],"affiliations":[{"raw_affiliation_string":"Monash University","institution_ids":["https://openalex.org/I2801239119","https://openalex.org/I56590836"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5021223733"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16998893,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.5568000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.5568000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/situational-ethics","display_name":"Situational ethics","score":0.6302000284194946},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.5249000191688538},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5184000134468079},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.5063999891281128},{"id":"https://openalex.org/keywords/valence","display_name":"Valence (chemistry)","score":0.5001000165939331},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.4821999967098236},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.41190001368522644},{"id":"https://openalex.org/keywords/focus-group","display_name":"Focus group","score":0.40790000557899475},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4000000059604645},{"id":"https://openalex.org/keywords/group","display_name":"Group (periodic table)","score":0.39309999346733093}],"concepts":[{"id":"https://openalex.org/C9114305","wikidata":"https://www.wikidata.org/wiki/Q1428317","display_name":"Situational ethics","level":2,"score":0.6302000284194946},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.571399986743927},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5608000159263611},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.5249000191688538},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5184000134468079},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.5063999891281128},{"id":"https://openalex.org/C168900304","wikidata":"https://www.wikidata.org/wiki/Q171407","display_name":"Valence (chemistry)","level":2,"score":0.5001000165939331},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.49079999327659607},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.4821999967098236},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.41190001368522644},{"id":"https://openalex.org/C56995899","wikidata":"https://www.wikidata.org/wiki/Q1126687","display_name":"Focus group","level":2,"score":0.40790000557899475},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4000000059604645},{"id":"https://openalex.org/C2781311116","wikidata":"https://www.wikidata.org/wiki/Q83306","display_name":"Group (periodic table)","level":2,"score":0.39309999346733093},{"id":"https://openalex.org/C2776141551","wikidata":"https://www.wikidata.org/wiki/Q16000087","display_name":"Emotion perception","level":3,"score":0.39149999618530273},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3853999972343445},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.36059999465942383},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.35420000553131104},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.3508000075817108},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.34540000557899475},{"id":"https://openalex.org/C145804949","wikidata":"https://www.wikidata.org/wiki/Q478123","display_name":"Situation awareness","level":2,"score":0.34369999170303345},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.34119999408721924},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3366999924182892},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C2776544517","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Unexpected events","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C108154423","wikidata":"https://www.wikidata.org/wiki/Q1469792","display_name":"Salience (neuroscience)","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.3075000047683716},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.30300000309944153},{"id":"https://openalex.org/C180872759","wikidata":"https://www.wikidata.org/wiki/Q874405","display_name":"Social group","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C86658582","wikidata":"https://www.wikidata.org/wiki/Q1432778","display_name":"Social cognition","level":3,"score":0.28600001335144043},{"id":"https://openalex.org/C137878579","wikidata":"https://www.wikidata.org/wiki/Q9636076","display_name":"Joint attention","level":3,"score":0.28029999136924744},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C87156501","wikidata":"https://www.wikidata.org/wiki/Q7268708","display_name":"Qualitative property","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C3018587665","wikidata":"https://www.wikidata.org/wiki/Q7268696","display_name":"Qualitative analysis","level":3,"score":0.26010000705718994},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2574000060558319}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mlsp62443.2025.11204342","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp62443.2025.11204342","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 35th International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1575132216","https://openalex.org/W1603712378","https://openalex.org/W2081112272","https://openalex.org/W2094637479","https://openalex.org/W2123328577","https://openalex.org/W2140296984","https://openalex.org/W2341528187","https://openalex.org/W2486404862","https://openalex.org/W2527646968","https://openalex.org/W2767348466","https://openalex.org/W2793312177","https://openalex.org/W2888683367","https://openalex.org/W2891628231","https://openalex.org/W2914481831","https://openalex.org/W2951556150","https://openalex.org/W2963962355","https://openalex.org/W2978756075","https://openalex.org/W2996209825","https://openalex.org/W3089214424","https://openalex.org/W3095255024","https://openalex.org/W3138516171","https://openalex.org/W3192648700","https://openalex.org/W4294214983","https://openalex.org/W4307045186","https://openalex.org/W4387129418","https://openalex.org/W4390905801","https://openalex.org/W4402671548","https://openalex.org/W4409762288"],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"individual,":[1,131,142],"group":[2,37,59,86,108,132,143],"and":[3,38,50,61,85,93,101,121,126,133,144,151,180],"event":[4,39,134],"level":[5,40,109,135],"emotions":[6,123],"along":[7],"with":[8,154],"contextual":[9],"information":[10,63],"is":[11,182],"crucial":[12],"for":[13],"analyzing":[14],"a":[15,47],"multi-person":[16,69],"social":[17],"situation.":[18],"To":[19,88],"achieve":[20],"this,":[21],"we":[22,91],"frame":[23],"emotion":[24,33,70,81],"comprehension":[25],"as":[26,128,130],"the":[27,159,173],"task":[28],"of":[29,106,111,161,175],"predicting":[30],"fine-grained":[31],"individual":[32],"to":[34,64,96,117],"coarse":[35],"grained":[36,100],"emotion.":[41],"We":[42,167],"introduce":[43],"GEMS":[44,115,162],"that":[45,169],"leverages":[46],"multimodal":[48],"swin-transformer":[49],"S3Attention":[51],"based":[52,79],"architecture,":[53],"which":[54],"processes":[55],"an":[56],"input":[57],"scene,":[58],"members,":[60],"context":[62],"generate":[65],"joint":[66],"predictions.":[67],"Existing":[68],"related":[71],"benchmarks":[72],"mainly":[73],"focus":[74],"on":[75,80,104,164],"atomic":[76],"interactions":[77],"primarily":[78],"perception":[82],"over":[83],"time":[84],"level.":[87],"this":[89],"end,":[90],"extend":[92],"propose":[94],"VGAF-GEMS":[95,165],"provide":[97],"more":[98],"fine":[99],"holistic":[102],"analysis":[103],"top":[105],"existing":[107],"annotation":[110],"VGAF":[112],"dataset":[113],"[1].":[114],"aims":[116],"predict":[118],"basic":[119],"discrete":[120],"continuous":[122],"(including":[124],"valence":[125],"arousal)":[127],"well":[129],"perceived":[136],"emotions.":[137],"Our":[138],"benchmarking":[139],"effort":[140],"links":[141],"situational":[145],"emotional":[146],"responses":[147],"holistically.":[148],"The":[149,178],"quantitative":[150],"qualitative":[152],"comparisons":[153],"adapted":[155],"state-of-the-art":[156],"models":[157],"demonstrate":[158],"effectiveness":[160],"framework":[163],"benchmarking.":[166],"believe":[168],"it":[170],"will":[171],"pave":[172],"way":[174],"further":[176],"research.":[177],"code":[179],"data":[181],"available":[183],"at:":[184],"https://github.com/katariaak579/GEMS":[185]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-24T00:00:00"}
