{"id":"https://openalex.org/W3197596377","doi":"https://doi.org/10.21437/interspeech.2021-273","title":"Visual Transformers for Primates Classification and Covid Detection","display_name":"Visual Transformers for Primates Classification and Covid Detection","publication_year":2021,"publication_date":"2021-08-27","ids":{"openalex":"https://openalex.org/W3197596377","doi":"https://doi.org/10.21437/interspeech.2021-273","mag":"3197596377"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2021-273","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-273","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2212.10093","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069846773","display_name":"Steffen Illium","orcid":"https://orcid.org/0000-0003-0021-436X"},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Steffen Illium","raw_affiliation_strings":["Mobile and Distributed Systems Group, LMU Munich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mobile and Distributed Systems Group, LMU Munich","institution_ids":["https://openalex.org/I8204097"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052914309","display_name":"Robert M\u00fcller","orcid":"https://orcid.org/0000-0003-3108-713X"},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Robert M\u00fcller","raw_affiliation_strings":["Mobile and Distributed Systems Group, LMU Munich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mobile and Distributed Systems Group, LMU Munich","institution_ids":["https://openalex.org/I8204097"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024006892","display_name":"Andreas Sedlmeier","orcid":null},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Andreas Sedlmeier","raw_affiliation_strings":["Mobile and Distributed Systems Group, LMU Munich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mobile and Distributed Systems Group, LMU Munich","institution_ids":["https://openalex.org/I8204097"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069249577","display_name":"Claudia-Linnhoff Popien","orcid":null},"institutions":[{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Claudia-Linnhoff Popien","raw_affiliation_strings":["Mobile and Distributed Systems Group, LMU Munich"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mobile and Distributed Systems Group, LMU Munich","institution_ids":["https://openalex.org/I8204097"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3898,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.81703153,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"451","last_page":"455"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7427915930747986},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.7237051129341125},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.7037829160690308},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.6453593969345093},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6031301617622375},{"id":"https://openalex.org/keywords/coronavirus-disease-2019","display_name":"Coronavirus disease 2019 (COVID-19)","score":0.5112237930297852},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45564302802085876},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.39294612407684326},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3480777144432068},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3241804242134094},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14206013083457947}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7427915930747986},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.7237051129341125},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.7037829160690308},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.6453593969345093},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6031301617622375},{"id":"https://openalex.org/C3008058167","wikidata":"https://www.wikidata.org/wiki/Q84263196","display_name":"Coronavirus disease 2019 (COVID-19)","level":4,"score":0.5112237930297852},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45564302802085876},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.39294612407684326},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3480777144432068},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3241804242134094},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14206013083457947},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C524204448","wikidata":"https://www.wikidata.org/wiki/Q788926","display_name":"Infectious disease (medical specialty)","level":3,"score":0.0},{"id":"https://openalex.org/C2779134260","wikidata":"https://www.wikidata.org/wiki/Q12136","display_name":"Disease","level":2,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2021-273","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-273","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2212.10093","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.10093","pdf_url":"https://arxiv.org/pdf/2212.10093","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2212.10093","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.10093","pdf_url":"https://arxiv.org/pdf/2212.10093","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7200000286102295,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W114730584","https://openalex.org/W197865394","https://openalex.org/W1686810756","https://openalex.org/W1836465849","https://openalex.org/W1972567154","https://openalex.org/W2059652044","https://openalex.org/W2194775991","https://openalex.org/W2405274704","https://openalex.org/W2526050071","https://openalex.org/W2529337537","https://openalex.org/W2899663614","https://openalex.org/W2908510526","https://openalex.org/W2914166397","https://openalex.org/W2962897394","https://openalex.org/W3015995734","https://openalex.org/W3035378948","https://openalex.org/W3094502228","https://openalex.org/W3097426020","https://openalex.org/W3134945014","https://openalex.org/W3198909755","https://openalex.org/W4309793872","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2530685530","https://openalex.org/W4375868962","https://openalex.org/W2011227383","https://openalex.org/W2088854863","https://openalex.org/W4402568167","https://openalex.org/W3179495260","https://openalex.org/W1976719989","https://openalex.org/W3127543252","https://openalex.org/W2897924318","https://openalex.org/W2138997758"],"abstract_inverted_index":{"We":[0,48],"apply":[1],"the":[2,12,56],"vision":[3],"transformer,":[4],"a":[5],"deep":[6],"machine":[7],"learning":[8],"model":[9,46],"build":[10],"around":[11],"attention":[13],"mechanism,":[14],"on":[15,34],"mel-spectrogram":[16],"representations":[17],"of":[18,41,58],"raw":[19],"audio":[20,63],"recordings.":[21],"When":[22],"adding":[23],"mel-based":[24],"data":[25],"augmentation":[26],"techniques":[27],"and":[28,37,54],"sample-weighting,":[29],"we":[30],"achieve":[31],"comparable":[32],"performance":[33],"both":[35],"(PRS":[36],"CCS":[38],"challenge)":[39],"tasks":[40],"ComParE21,":[42],"outperforming":[43],"most":[44],"single":[45],"baselines.":[47],"further":[49],"introduce":[50],"overlapping":[51],"vertical":[52],"patching":[53],"evaluate":[55],"influence":[57],"parameter":[59],"configurations.":[60],"Index":[61],"Terms:":[62],"classification,":[64],"attention,":[65],"mel-spectrogram,":[66],"unbalanced":[67],"data-sets,":[68],"computational":[69],"paralinguistics":[70]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
