{"id":"https://openalex.org/W2977965380","doi":"https://doi.org/10.1587/transinf.2018edp7383","title":"Cross-Domain Deep Feature Combination for Bird Species Classification with Audio-Visual Data","display_name":"Cross-Domain Deep Feature Combination for Bird Species Classification with Audio-Visual Data","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2977965380","doi":"https://doi.org/10.1587/transinf.2018edp7383","mag":"2977965380"},"language":"en","primary_location":{"id":"doi:10.1587/transinf.2018edp7383","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2018edp7383","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E102.D/10/E102.D_2018EDP7383/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.jstage.jst.go.jp/article/transinf/E102.D/10/E102.D_2018EDP7383/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007514809","display_name":"Naranchimeg Bold","orcid":"https://orcid.org/0000-0003-4152-4305"},"institutions":[{"id":"https://openalex.org/I173009982","display_name":"Iwate University","ror":"https://ror.org/04cd75h10","country_code":"JP","type":"education","lineage":["https://openalex.org/I173009982"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Naranchimeg BOLD","raw_affiliation_strings":["Graduate School of Engineering, Department of Design and Media Technology, Iwate University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, Department of Design and Media Technology, Iwate University","institution_ids":["https://openalex.org/I173009982"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089283853","display_name":"Chao Zhang","orcid":"https://orcid.org/0000-0002-0845-9217"},"institutions":[{"id":"https://openalex.org/I111966504","display_name":"University of Fukui","ror":"https://ror.org/00msqp585","country_code":"JP","type":"education","lineage":["https://openalex.org/I111966504"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Chao ZHANG","raw_affiliation_strings":["Graduate School of Engineering, Information Science, University of Fukui"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, Information Science, University of Fukui","institution_ids":["https://openalex.org/I111966504"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045648943","display_name":"Takuya Akashi","orcid":"https://orcid.org/0000-0001-9177-7306"},"institutions":[{"id":"https://openalex.org/I173009982","display_name":"Iwate University","ror":"https://ror.org/04cd75h10","country_code":"JP","type":"education","lineage":["https://openalex.org/I173009982"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takuya AKASHI","raw_affiliation_strings":["Graduate School of Engineering, Department of Design and Media Technology, Iwate University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, Department of Design and Media Technology, Iwate University","institution_ids":["https://openalex.org/I173009982"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6267,"has_fulltext":true,"cited_by_count":22,"citation_normalized_percentile":{"value":0.80875831,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"E102.D","issue":"10","first_page":"2033","last_page":"2042"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10199","display_name":"Wildlife Ecology and Conservation","score":0.967199981212616,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8778330683708191},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.7628433704376221},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7035094499588013},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.6703124046325684},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6227389574050903},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5988055467605591},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.5358262062072754},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5238081216812134},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5165857076644897},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4604876637458801},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.44157612323760986},{"id":"https://openalex.org/keywords/data-type","display_name":"Data type","score":0.4293581247329712},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.42591673135757446},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4233609437942505},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3464467227458954}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8778330683708191},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.7628433704376221},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7035094499588013},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.6703124046325684},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6227389574050903},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5988055467605591},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.5358262062072754},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5238081216812134},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5165857076644897},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4604876637458801},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.44157612323760986},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.4293581247329712},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42591673135757446},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4233609437942505},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3464467227458954},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transinf.2018edp7383","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2018edp7383","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E102.D/10/E102.D_2018EDP7383/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1587/transinf.2018edp7383","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2018edp7383","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E102.D/10/E102.D_2018EDP7383/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7300000190734863,"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land"}],"awards":[{"id":"https://openalex.org/G2424557075","display_name":null,"funder_award_id":"JP16K01647","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7240787011","display_name":null,"funder_award_id":"JP19K11515","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8601184843","display_name":null,"funder_award_id":"JP16KK0069","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2977965380.pdf","grobid_xml":"https://content.openalex.org/works/W2977965380.grobid-xml"},"referenced_works_count":51,"referenced_works":["https://openalex.org/W56385144","https://openalex.org/W154472438","https://openalex.org/W1616462885","https://openalex.org/W1797268635","https://openalex.org/W1832693441","https://openalex.org/W1846473900","https://openalex.org/W1916445035","https://openalex.org/W1984514441","https://openalex.org/W1995562189","https://openalex.org/W2014102544","https://openalex.org/W2022799064","https://openalex.org/W2053101950","https://openalex.org/W2076462394","https://openalex.org/W2097117768","https://openalex.org/W2112739286","https://openalex.org/W2120480077","https://openalex.org/W2131929175","https://openalex.org/W2132791018","https://openalex.org/W2147800946","https://openalex.org/W2154579312","https://openalex.org/W2155893237","https://openalex.org/W2156303437","https://openalex.org/W2158899491","https://openalex.org/W2160815625","https://openalex.org/W2163605009","https://openalex.org/W2164587673","https://openalex.org/W2170240176","https://openalex.org/W2184188583","https://openalex.org/W2194775991","https://openalex.org/W2210322478","https://openalex.org/W2212106655","https://openalex.org/W2388114291","https://openalex.org/W2511428026","https://openalex.org/W2570915410","https://openalex.org/W2576474710","https://openalex.org/W2593610980","https://openalex.org/W2603597171","https://openalex.org/W2606128082","https://openalex.org/W2610961739","https://openalex.org/W2619383789","https://openalex.org/W2630245091","https://openalex.org/W2696731410","https://openalex.org/W2734984521","https://openalex.org/W2751971575","https://openalex.org/W2785420330","https://openalex.org/W2808566528","https://openalex.org/W2962798895","https://openalex.org/W2963012544","https://openalex.org/W2963956866","https://openalex.org/W3099903704","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2530685530","https://openalex.org/W4375868962","https://openalex.org/W2088854863","https://openalex.org/W2011227383","https://openalex.org/W1976719989","https://openalex.org/W2942893872","https://openalex.org/W2065606036","https://openalex.org/W3179495260","https://openalex.org/W2440023763","https://openalex.org/W2962474440"],"abstract_inverted_index":{"In":[0,39,131],"recent":[1],"decade,":[2],"many":[3],"state-of-the-art":[4],"algorithms":[5],"on":[6,46,104,141],"image":[7,118],"classification":[8,13,193],"as":[9,11],"well":[10],"audio":[12,59,120,152],"have":[14],"achieved":[15],"noticeable":[16],"successes":[17],"with":[18,155,176],"the":[19,30,52,89,105,127,132,138,158,168,192],"development":[20],"of":[21,29,36,54,81,91,99,170,181],"deep":[22],"convolutional":[23],"neural":[24],"network":[25,139],"(CNN).":[26],"However,":[27],"most":[28],"works":[31],"only":[32,113,177],"exploit":[33],"single":[34],"type":[35,180],"training":[37,93],"data.":[38,182],"this":[40],"paper,":[41],"we":[42,72,108,134],"present":[43],"a":[44,142,164],"study":[45],"classifying":[47],"bird":[48],"species":[49],"by":[50],"exploiting":[51],"combination":[53,169],"both":[55,171],"visual":[56],"(images)":[57],"and":[58,119,136],"(sounds)":[60],"data":[61,94,121,146,153,159,172],"using":[62],"CNN,":[63],"which":[64,166],"has":[65],"been":[66],"sparsely":[67],"treated":[68],"so":[69],"far.":[70],"Specifically,":[71],"propose":[73],"CNN-based":[74],"multimodal":[75],"learning":[76,188],"models":[77,174],"in":[78],"three":[79],"types":[80],"fusion":[82],"strategies":[83],"(early,":[84],"middle,":[85],"late)":[86],"to":[87,114,125,157],"settle":[88],"issues":[90],"combining":[92],"cross":[95],"domains.":[96],"The":[97],"advantage":[98],"our":[100,149],"proposed":[101],"method":[102],"lies":[103],"fact":[106],"that":[107,163,186],"can":[109,189],"utilize":[110],"CNN":[111],"not":[112],"extract":[115],"features":[116,128],"from":[117],"(spectrogram)":[122],"but":[123],"also":[124,184],"combine":[126],"across":[129],"modalities.":[130],"experiment,":[133],"train":[135],"evaluate":[137],"structure":[140],"comprehensive":[143],"CUB-200-2011":[144],"standard":[145],"set":[147,154],"combing":[148],"originally":[150],"collected":[151],"respect":[156],"species.":[160],"We":[161,183],"observe":[162],"model":[165],"utilizes":[167],"outperforms":[173],"trained":[175],"an":[178],"either":[179],"show":[185],"transfer":[187],"significantly":[190],"increase":[191],"performance.":[194]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
