{"id":"https://openalex.org/W2767915528","doi":"https://doi.org/10.1145/3136755.3143005","title":"Multi-modal emotion recognition using semi-supervised learning and multiple neural networks in the wild","display_name":"Multi-modal emotion recognition using semi-supervised learning and multiple neural networks in the wild","publication_year":2017,"publication_date":"2017-11-03","ids":{"openalex":"https://openalex.org/W2767915528","doi":"https://doi.org/10.1145/3136755.3143005","mag":"2767915528"},"language":"en","primary_location":{"id":"doi:10.1145/3136755.3143005","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3136755.3143005","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th ACM International Conference on Multimodal Interaction","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102999178","display_name":"Dae Ha Kim","orcid":"https://orcid.org/0000-0003-3838-126X"},"institutions":[{"id":"https://openalex.org/I191879574","display_name":"Inha University","ror":"https://ror.org/01easw929","country_code":"KR","type":"education","lineage":["https://openalex.org/I191879574"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Dae Ha Kim","raw_affiliation_strings":["Inha University, South Korea"],"affiliations":[{"raw_affiliation_string":"Inha University, South Korea","institution_ids":["https://openalex.org/I191879574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100398226","display_name":"Min Kyu Lee","orcid":"https://orcid.org/0000-0003-3447-4936"},"institutions":[{"id":"https://openalex.org/I191879574","display_name":"Inha University","ror":"https://ror.org/01easw929","country_code":"KR","type":"education","lineage":["https://openalex.org/I191879574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Min Kyu Lee","raw_affiliation_strings":["Inha University, South Korea"],"affiliations":[{"raw_affiliation_string":"Inha University, South Korea","institution_ids":["https://openalex.org/I191879574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072074332","display_name":"Dong Yoon Choi","orcid":"https://orcid.org/0000-0003-2990-9691"},"institutions":[{"id":"https://openalex.org/I191879574","display_name":"Inha University","ror":"https://ror.org/01easw929","country_code":"KR","type":"education","lineage":["https://openalex.org/I191879574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Dong Yoon Choi","raw_affiliation_strings":["Inha University, South Korea"],"affiliations":[{"raw_affiliation_string":"Inha University, South Korea","institution_ids":["https://openalex.org/I191879574"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065677543","display_name":"Byung Cheol Song","orcid":"https://orcid.org/0000-0001-8742-3433"},"institutions":[{"id":"https://openalex.org/I191879574","display_name":"Inha University","ror":"https://ror.org/01easw929","country_code":"KR","type":"education","lineage":["https://openalex.org/I191879574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Byung Cheol Song","raw_affiliation_strings":["Inha University, South Korea"],"affiliations":[{"raw_affiliation_string":"Inha University, South Korea","institution_ids":["https://openalex.org/I191879574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5102999178"],"corresponding_institution_ids":["https://openalex.org/I191879574"],"apc_list":null,"apc_paid":null,"fwci":6.3264,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.96704178,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"529","last_page":"535"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7902661561965942},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7429071068763733},{"id":"https://openalex.org/keywords/landmark","display_name":"Landmark","score":0.6391672492027283},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5674629211425781},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5279157161712646},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4772341549396515},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.47175222635269165},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.458435595035553},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.440976083278656},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4408787488937378},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.43498510122299194},{"id":"https://openalex.org/keywords/emotion-classification","display_name":"Emotion classification","score":0.43049103021621704},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.41689401865005493},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.39990341663360596},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.39470118284225464}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7902661561965942},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7429071068763733},{"id":"https://openalex.org/C2780297707","wikidata":"https://www.wikidata.org/wiki/Q4895393","display_name":"Landmark","level":2,"score":0.6391672492027283},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5674629211425781},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5279157161712646},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4772341549396515},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.47175222635269165},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.458435595035553},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.440976083278656},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4408787488937378},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.43498510122299194},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.43049103021621704},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.41689401865005493},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.39990341663360596},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39470118284225464},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3136755.3143005","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3136755.3143005","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th ACM International Conference on Multimodal Interaction","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W830076066","https://openalex.org/W1522734439","https://openalex.org/W1677182931","https://openalex.org/W1686810756","https://openalex.org/W1836465849","https://openalex.org/W1934410531","https://openalex.org/W1966797434","https://openalex.org/W1981918162","https://openalex.org/W2033773055","https://openalex.org/W2039051707","https://openalex.org/W2085662862","https://openalex.org/W2097117768","https://openalex.org/W2097290407","https://openalex.org/W2103943262","https://openalex.org/W2106390385","https://openalex.org/W2108598243","https://openalex.org/W2119821739","https://openalex.org/W2121684305","https://openalex.org/W2132889650","https://openalex.org/W2136504847","https://openalex.org/W2147347517","https://openalex.org/W2154579312","https://openalex.org/W2161969291","https://openalex.org/W2163605009","https://openalex.org/W2191779130","https://openalex.org/W2194775991","https://openalex.org/W2217426128","https://openalex.org/W2341528187","https://openalex.org/W2530816535","https://openalex.org/W2546875627","https://openalex.org/W2548264631","https://openalex.org/W2548529926","https://openalex.org/W2548899748","https://openalex.org/W2618530766","https://openalex.org/W2624871570","https://openalex.org/W2767348466","https://openalex.org/W2951970475","https://openalex.org/W2963446712","https://openalex.org/W2964137095","https://openalex.org/W3101998545","https://openalex.org/W3103757879","https://openalex.org/W6680140577"],"related_works":["https://openalex.org/W4380075502","https://openalex.org/W3094370402","https://openalex.org/W4223943233","https://openalex.org/W4312200629","https://openalex.org/W4360585206","https://openalex.org/W2970216048","https://openalex.org/W4364306694","https://openalex.org/W2724710774","https://openalex.org/W4380086463","https://openalex.org/W4225161397"],"abstract_inverted_index":{"Human":[0],"emotion":[1,109,140],"recognition":[2],"is":[3,8,62,94,105,143],"a":[4,22,44,80,98,168],"research":[5],"topic":[6],"that":[7,116],"receiving":[9],"continuous":[10],"attention":[11],"in":[12,43,160],"computer":[13],"vision":[14],"and":[15,41,70,97],"artificial":[16],"intelligence":[17],"domains.":[18],"This":[19],"paper":[20],"proposes":[21],"method":[23,49,166],"for":[24,82,107,123],"classifying":[25],"human":[26],"emotions":[27],"through":[28],"multiple":[29,149],"neural":[30],"networks":[31],"based":[32,101,112],"on":[33,102,113,155],"multi-modal":[34],"signals":[35,118],"which":[36],"consist":[37],"of":[38,58,77,88,148,171],"image,":[39],"landmark,":[40],"audio":[42,117,129],"wild":[45],"environment.":[46],"The":[47],"proposed":[48,106,165],"has":[50],"the":[51,55,59,74,103,135,152,156,161,164],"following":[52],"features.":[53],"First,":[54],"learning":[56,69,72,131],"performance":[57],"image-based":[60],"network":[61,100],"greatly":[63],"improved":[64],"by":[65],"employing":[66],"both":[67],"multi-task":[68],"semi-supervised":[71],"using":[73],"spatio-temporal":[75],"characteristic":[76],"videos.":[78],"Second,":[79],"model":[81,104],"converting":[83],"1-dimensional":[84],"(1D)":[85],"landmark":[86],"information":[87],"face":[89],"into":[90],"two-dimensional":[91],"(2D)":[92],"images,":[93],"newly":[95],"proposed,":[96],"CNN-LSTM":[99],"better":[108],"recognition.":[110],"Third,":[111],"an":[114,128],"observation":[115],"are":[119],"often":[120],"very":[121],"effective":[122],"specific":[124,136],"emotions,":[125],"we":[126],"propose":[127],"deep":[130],"mechanism":[132],"robust":[133],"to":[134,145],"emotions.":[137],"Finally,":[138],"so-called":[139],"adaptive":[141],"fusion":[142],"applied":[144],"enable":[146],"synergy":[147],"networks.":[150],"In":[151],"fifth":[153],"attempt":[154],"given":[157],"test":[158],"set":[159],"EmotiW2017":[162],"challenge,":[163],"achieved":[167],"classification":[169],"accuracy":[170],"57.12%.":[172]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":13},{"year":2018,"cited_by_count":6}],"updated_date":"2026-04-01T17:29:45.350535","created_date":"2025-10-10T00:00:00"}
