{"id":"https://openalex.org/W3211894574","doi":"https://doi.org/10.1109/tmm.2021.3128738","title":"Isotropic Self-Supervised Learning for Driver Drowsiness Detection With Attention-Based Multimodal Fusion","display_name":"Isotropic Self-Supervised Learning for Driver Drowsiness Detection With Attention-Based Multimodal Fusion","publication_year":2021,"publication_date":"2021-11-17","ids":{"openalex":"https://openalex.org/W3211894574","doi":"https://doi.org/10.1109/tmm.2021.3128738","mag":"3211894574"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2021.3128738","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3128738","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013704823","display_name":"Luntian Mou","orcid":"https://orcid.org/0000-0002-1551-4448"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Luntian Mou","raw_affiliation_strings":["Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1551-4448","affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101814084","display_name":"Chao Zhou","orcid":"https://orcid.org/0009-0008-7607-3827"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Zhou","raw_affiliation_strings":["Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083884675","display_name":"Pengtao Xie","orcid":"https://orcid.org/0000-0003-0521-174X"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pengtao Xie","raw_affiliation_strings":["University of California, San Diego, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, San Diego, CA, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100627236","display_name":"Pengfei Zhao","orcid":"https://orcid.org/0000-0001-6419-6653"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengfei Zhao","raw_affiliation_strings":["Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6419-6653","affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010478919","display_name":"Ramesh Jain","orcid":"https://orcid.org/0000-0003-2373-4966"},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]},{"id":"https://openalex.org/I4210136895","display_name":"Institute for the Future","ror":"https://ror.org/049tcsg76","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210136895"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ramesh Jain","raw_affiliation_strings":["Institute for Future Health, Bren School of Information and Computer Sciences, University of California, Irvine, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-2373-4966","affiliations":[{"raw_affiliation_string":"Institute for Future Health, Bren School of Information and Computer Sciences, University of California, Irvine, CA, USA","institution_ids":["https://openalex.org/I4210136895","https://openalex.org/I204250578"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018478553","display_name":"Wen Gao","orcid":"https://orcid.org/0000-0002-8070-802X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Gao","raw_affiliation_strings":["Institute of Digital Media, Peking University, Beijing, China","School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-8070-802X","affiliations":[{"raw_affiliation_string":"Institute of Digital Media, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020527092","display_name":"Baocai Yin","orcid":"https://orcid.org/0000-0003-3121-1823"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baocai Yin","raw_affiliation_strings":["Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3121-1823","affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Multimedia and Intelligent Software Technology, Beijing Institute of Artificial Intelligence, Faculty of Information Technology, Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.9165,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.95562866,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"25","issue":null,"first_page":"529","last_page":"542"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11373","display_name":"Sleep and Work-Related Fatigue","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11373","display_name":"Sleep and Work-Related Fatigue","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12597","display_name":"Fire Detection and Safety Systems","score":0.9781000018119812,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.95169997215271,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8204307556152344},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7316340208053589},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6155851483345032},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5400510430335999},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.530876636505127},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5132620334625244},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4973457157611847},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.49072277545928955},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.48675107955932617},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.44883227348327637},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.44479769468307495},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43321558833122253},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.4279637336730957},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4260830283164978},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.42111796140670776},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4154531955718994},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.15471529960632324}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8204307556152344},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7316340208053589},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6155851483345032},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5400510430335999},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.530876636505127},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5132620334625244},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4973457157611847},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.49072277545928955},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.48675107955932617},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44883227348327637},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.44479769468307495},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43321558833122253},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.4279637336730957},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4260830283164978},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.42111796140670776},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4154531955718994},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.15471529960632324},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2021.3128738","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3128738","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Good health and well-being","score":0.49000000953674316,"id":"https://metadata.un.org/sdg/3"}],"awards":[{"id":"https://openalex.org/G3621289433","display_name":null,"funder_award_id":"61672068","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W1566256432","https://openalex.org/W1578985305","https://openalex.org/W1613465282","https://openalex.org/W1902237438","https://openalex.org/W1985867508","https://openalex.org/W1987654648","https://openalex.org/W1989085630","https://openalex.org/W2005749985","https://openalex.org/W2064675550","https://openalex.org/W2077395415","https://openalex.org/W2078039548","https://openalex.org/W2087681821","https://openalex.org/W2094726855","https://openalex.org/W2101956459","https://openalex.org/W2138621090","https://openalex.org/W2157331557","https://openalex.org/W2161969291","https://openalex.org/W2164186291","https://openalex.org/W2164699598","https://openalex.org/W2171221410","https://openalex.org/W2194775991","https://openalex.org/W2272340902","https://openalex.org/W2346607917","https://openalex.org/W2470673105","https://openalex.org/W2487852963","https://openalex.org/W2509901229","https://openalex.org/W2533176898","https://openalex.org/W2604676963","https://openalex.org/W2604772469","https://openalex.org/W2605351369","https://openalex.org/W2609575245","https://openalex.org/W2619383789","https://openalex.org/W2735673432","https://openalex.org/W2767520447","https://openalex.org/W2782396879","https://openalex.org/W2783618220","https://openalex.org/W2798991696","https://openalex.org/W2832876791","https://openalex.org/W2883790098","https://openalex.org/W2894818097","https://openalex.org/W2899973923","https://openalex.org/W2901907199","https://openalex.org/W2909963827","https://openalex.org/W2913033828","https://openalex.org/W2914641625","https://openalex.org/W2967815566","https://openalex.org/W2987741655","https://openalex.org/W2992048516","https://openalex.org/W2997475949","https://openalex.org/W2998388430","https://openalex.org/W3015309989","https://openalex.org/W3023371261","https://openalex.org/W3025665229","https://openalex.org/W3035524453","https://openalex.org/W3043319350","https://openalex.org/W3044774336","https://openalex.org/W3087792975","https://openalex.org/W3099805903","https://openalex.org/W3101227480","https://openalex.org/W3107551614","https://openalex.org/W3128764679","https://openalex.org/W6743596144","https://openalex.org/W6762521896","https://openalex.org/W6774314701","https://openalex.org/W7024581459"],"related_works":["https://openalex.org/W2983142544","https://openalex.org/W2891059443","https://openalex.org/W4281663961","https://openalex.org/W3208888551","https://openalex.org/W4220682630","https://openalex.org/W4313561566","https://openalex.org/W3208386644","https://openalex.org/W3181622257","https://openalex.org/W3133533225","https://openalex.org/W3163146846"],"abstract_inverted_index":{"Driverdrowsiness":[0],"is":[1,45,110,200,220,227],"an":[2,69,88,105,197],"important":[3],"cause":[4],"of":[5,39,79,102,123,165,184,187],"traffic":[6],"accidents.":[7],"Many":[8],"studies":[9,32],"using":[10],"computer":[11],"vision":[12],"techniques":[13],"to":[14,54,75,113,133,175,202,212,229],"detect":[15,230],"driver":[16,231],"drowsiness":[17,57,195,232],"states,":[18],"such":[19],"as":[20],"slow":[21],"blinking,":[22],"yawning,":[23],"and":[24,86,120,150,226,249],"nodding,":[25],"have":[26,33],"demonstrated":[27],"excellent":[28],"potential.":[29],"Although":[30],"existing":[31,252],"made":[34],"significant":[35],"progress,":[36],"the":[37,42,100,117,124,130,135,139,153,162,166,172,181,185,191,205,209,223,246,250],"number":[38],"samples":[40],"in":[41,142],"training":[43],"corpora":[44],"small,":[46],"which":[47],"makes":[48],"it":[49],"difficult":[50],"for":[51,138],"a":[52,217],"model":[53,90,109,132],"learn":[55,76],"effective":[56],"representations":[58,78],"from":[59,116,190,208],"images":[60,80],"or":[61],"videos.":[62],"To":[63,98,179],"address":[64],"this":[65],"issue,":[66],"we":[67,127],"develop":[68],"isotropic":[70],"self-supervised":[71],"learning":[72],"(IsoSSL)":[73],"approach":[74],"powerful":[77],"without":[81],"relying":[82],"on":[83,194,237],"human-provided":[84],"annotations":[85],"propose":[87],"IsoSSL-MoCo":[89,131],"by":[91,161,222],"combining":[92],"IsoSSL":[93],"with":[94],"momentum":[95],"contrast":[96],"(MoCo).":[97],"exploit":[99],"complementarity":[101],"multimodal":[103,107],"data,":[104],"attention-based":[106],"fusion":[108,155],"also":[111],"proposed":[112,154],"fuse":[114],"features":[115,189],"eye,":[118],"mouth,":[119],"optical":[121],"flow":[122],"head.":[125],"Specifically,":[126],"first":[128],"use":[129],"pretrain":[134],"image":[136,163],"encoders":[137,147,164],"three":[140,167,192],"modalities":[141,168,193],"other":[143],"datasets.":[144],"Then,":[145],"these":[146],"are":[148,169],"fine-tuned":[149],"integrated":[151],"into":[152,171],"model.":[156],"The":[157],"feature":[158,206],"vectors":[159,207],"generated":[160,221],"fed":[170],"recursive":[173,210],"layer":[174,211,225],"extract":[176],"temporal":[177,188],"information.":[178],"capture":[180],"importance":[182],"degrees":[183],"effects":[186],"detection,":[196],"attention":[198,224],"mechanism":[199],"introduced":[201],"automatically":[203],"weigh":[204],"improve":[213],"detection":[214],"accuracy.":[215],"Finally,":[216],"vector":[218],"representation":[219],"used":[228],"states.":[233],"Experimental":[234],"results":[235],"based":[236],"two":[238],"challenging":[239],"datasets":[240],"show":[241],"that":[242],"our":[243],"method":[244],"outperforms":[245],"baseline":[247],"methods":[248],"latest":[251],"methods.":[253]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
