{"id":"https://openalex.org/W3007382154","doi":"https://doi.org/10.1109/asru46091.2019.9003966","title":"Spoken Multiple-Choice Question Answering Using Multimodal Convolutional Neural Networks","display_name":"Spoken Multiple-Choice Question Answering Using Multimodal Convolutional Neural Networks","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3007382154","doi":"https://doi.org/10.1109/asru46091.2019.9003966","mag":"3007382154"},"language":"en","primary_location":{"id":"doi:10.1109/asru46091.2019.9003966","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru46091.2019.9003966","pdf_url":null,"source":{"id":"https://openalex.org/S4306498489","display_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067529162","display_name":"Shang-Bao Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Shang-Bao Luo","raw_affiliation_strings":["National Taiwan University of Science and Technology, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Taiwan University of Science and Technology, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048338308","display_name":"Hung-Shin Lee","orcid":"https://orcid.org/0000-0001-7044-9434"},"institutions":[{"id":"https://openalex.org/I4210098366","display_name":"Institute of Information Science, Academia Sinica","ror":"https://ror.org/00z83z196","country_code":"TW","type":"facility","lineage":["https://openalex.org/I4210098366","https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Hung-Shin Lee","raw_affiliation_strings":["Institute of Information Science, Academia Sinica, Taiwan"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science, Academia Sinica, Taiwan","institution_ids":["https://openalex.org/I4210098366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115603153","display_name":"Kuan\u2010Yu Chen","orcid":"https://orcid.org/0000-0002-6036-2199"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Kuan-Yu Chen","raw_affiliation_strings":["National Taiwan University of Science and Technology, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Taiwan University of Science and Technology, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071214181","display_name":"Hsin\u2010Min Wang","orcid":"https://orcid.org/0000-0003-3599-5071"},"institutions":[{"id":"https://openalex.org/I4210098366","display_name":"Institute of Information Science, Academia Sinica","ror":"https://ror.org/00z83z196","country_code":"TW","type":"facility","lineage":["https://openalex.org/I4210098366","https://openalex.org/I84653119"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Hsin-Min Wang","raw_affiliation_strings":["Institute of Information Science, Academia Sinica, Taiwan"],"affiliations":[{"raw_affiliation_string":"Institute of Information Science, Academia Sinica, Taiwan","institution_ids":["https://openalex.org/I4210098366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5067529162"],"corresponding_institution_ids":["https://openalex.org/I154864474"],"apc_list":null,"apc_paid":null,"fwci":0.5601,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.76350962,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"5","issue":null,"first_page":"772","last_page":"778"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7421732544898987},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6892976760864258},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.5900762677192688},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5306882858276367},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4733160734176636},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3754671812057495}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7421732544898987},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6892976760864258},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.5900762677192688},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5306882858276367},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4733160734176636},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3754671812057495}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru46091.2019.9003966","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru46091.2019.9003966","pdf_url":null,"source":{"id":"https://openalex.org/S4306498489","display_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1524333225","https://openalex.org/W1564003386","https://openalex.org/W1614298861","https://openalex.org/W1631260214","https://openalex.org/W2125436846","https://openalex.org/W2126776599","https://openalex.org/W2130237711","https://openalex.org/W2131342762","https://openalex.org/W2173361515","https://openalex.org/W2250432970","https://openalex.org/W2250539671","https://openalex.org/W2250595585","https://openalex.org/W2251355301","https://openalex.org/W2252000379","https://openalex.org/W2306803708","https://openalex.org/W2325162016","https://openalex.org/W2493916176","https://openalex.org/W2514741789","https://openalex.org/W2516196286","https://openalex.org/W2521709538","https://openalex.org/W2746097825","https://openalex.org/W2762022354","https://openalex.org/W2771904183","https://openalex.org/W2789078277","https://openalex.org/W2798858969","https://openalex.org/W2799201288","https://openalex.org/W2802201485","https://openalex.org/W2806081754","https://openalex.org/W2885485938","https://openalex.org/W2888867175","https://openalex.org/W2896457183","https://openalex.org/W2899771611","https://openalex.org/W2950577311","https://openalex.org/W2962685689","https://openalex.org/W2962809918","https://openalex.org/W2962854302","https://openalex.org/W2963123047","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W2963681467","https://openalex.org/W2963748441","https://openalex.org/W2963900105","https://openalex.org/W2964121744","https://openalex.org/W3104486441","https://openalex.org/W4295253143","https://openalex.org/W4385245566","https://openalex.org/W4387428949","https://openalex.org/W6631190155","https://openalex.org/W6631362777","https://openalex.org/W6636811518","https://openalex.org/W6678890848","https://openalex.org/W6679429981","https://openalex.org/W6739901393","https://openalex.org/W6745159025","https://openalex.org/W6756040250"],"related_works":["https://openalex.org/W2384605597","https://openalex.org/W2387743295","https://openalex.org/W2115758952","https://openalex.org/W3082787378","https://openalex.org/W2136007095","https://openalex.org/W2366230879","https://openalex.org/W3208425359","https://openalex.org/W2349927912","https://openalex.org/W3159777597","https://openalex.org/W3204019825"],"abstract_inverted_index":{"In":[0,131],"a":[1,48,67,75,173,221],"spoken":[2,68,97,127,224],"multiple-choice":[3],"question":[4],"answering":[5],"(MCQA)":[6],"task,":[7],"where":[8],"passages,":[9],"questions,":[10],"and":[11,90,146,153,170,191],"choices":[12],"are":[13,103,138,159],"given":[14],"in":[15,27,120,162,228,237],"the":[16,22,42,54,59,63,100,126,132,144,150,164,167,183,186,189,194,202,211,230,240],"form":[17],"of":[18,44,185,206,213],"speech,":[19],"usually":[20],"only":[21,47],"auto-transcribed":[23],"text":[24,107],"is":[25,176,198],"considered":[26],"system":[28,129],"development.":[29],"The":[30],"acoustic-level":[31,55,60,91,101],"information":[32,56,61,65],"may":[33],"contain":[34],"useful":[35],"cues":[36],"for":[37,66,96,149,178],"answer":[38,197],"prediction.":[39],"However,":[40],"to":[41,87,105,141,188,219],"best":[43],"our":[45],"knowledge,":[46],"few":[49],"studies":[50],"focus":[51],"on":[52,82,201,210],"using":[53],"or":[57,116],"fusing":[58],"with":[62],"text-level":[64,147],"MCQA":[69,128,225],"task.":[70],"Therefore,":[71],"this":[72],"paper":[73],"presents":[74],"hierarchical":[76],"multistage":[77],"multimodal":[78],"(HMM)":[79],"framework":[80,233],"based":[81,200],"convolutional":[83],"neural":[84,94],"networks":[85],"(CNNs)":[86],"integrate":[88],"text-":[89],"statistics":[92,102],"into":[93],"modeling":[95],"MCQA.":[98],"Specifically,":[99],"expected":[104],"offset":[106],"inaccuracies":[108],"caused":[109],"by":[110],"automatic":[111],"speech":[112],"recognition":[113],"(ASR)":[114],"systems":[115],"representation":[117,175],"inadequacy":[118],"lurking":[119],"word":[121],"embedding":[122],"generators,":[123],"thereby":[124],"making":[125],"robust.":[130],"proposed":[133,231],"HMM":[134,232],"framework,":[135],"two":[136],"modalities":[137],"first":[139],"manipulated":[140],"separately":[142],"derive":[143],"acoustic-":[145],"representations":[148,205],"passage,":[151,168],"question,":[152,169],"choices.":[154,171,208],"Next,":[155],"these":[156],"clever":[157],"features":[158],"jointly":[160],"involved":[161],"inferring":[163],"relationships":[165],"among":[166],"Then,":[172],"final":[174,204],"derived":[177],"each":[179],"choice,":[180],"which":[181],"encodes":[182],"relationship":[184],"choice":[187],"passage":[190],"question.":[192],"Finally,":[193],"most":[195],"likely":[196],"determined":[199],"individual":[203],"all":[207],"Evaluated":[209],"data":[212],"\u201cFormosa":[214],"Grand":[215],"Challenge":[216],"-":[217],"Talk":[218],"AI\u201d,":[220],"Mandarin":[222],"Chinese":[223],"contest":[226],"held":[227],"2018,":[229],"achieves":[234],"remarkable":[235],"improvements":[236],"accuracy":[238],"over":[239],"text-only":[241],"baseline.":[242]},"counts_by_year":[{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
