{"id":"https://openalex.org/W4415593855","doi":"https://doi.org/10.1109/access.2025.3625120","title":"Multi-Modal Understanding of FOMC Press Conferences for Question Generation via Visual and Textual Cues","display_name":"Multi-Modal Understanding of FOMC Press Conferences for Question Generation via Visual and Textual Cues","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4415593855","doi":"https://doi.org/10.1109/access.2025.3625120"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3625120","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3625120","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3625120","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071285744","display_name":"Khaled Alnuaimi","orcid":null},"institutions":[{"id":"https://openalex.org/I176601375","display_name":"Khalifa University of Science and Technology","ror":"https://ror.org/05hffr360","country_code":"AE","type":"education","lineage":["https://openalex.org/I176601375"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Khaled Alnuaimi","raw_affiliation_strings":["Abu Dhabi Investment Authority (ADIA), Abu Dhabi, United Arab Emirates","Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Abu Dhabi Investment Authority (ADIA), Abu Dhabi, United Arab Emirates","institution_ids":[]},{"raw_affiliation_string":"Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I176601375"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036034478","display_name":"Mohamad Alansari","orcid":"https://orcid.org/0000-0003-2960-2972"},"institutions":[{"id":"https://openalex.org/I176601375","display_name":"Khalifa University of Science and Technology","ror":"https://ror.org/05hffr360","country_code":"AE","type":"education","lineage":["https://openalex.org/I176601375"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Mohamad Alansari","raw_affiliation_strings":["Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates"],"raw_orcid":"https://orcid.org/0000-0003-2960-2972","affiliations":[{"raw_affiliation_string":"Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I176601375"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018399483","display_name":"Mohammed Salah","orcid":"https://orcid.org/0000-0003-1646-7919"},"institutions":[{"id":"https://openalex.org/I176601375","display_name":"Khalifa University of Science and Technology","ror":"https://ror.org/05hffr360","country_code":"AE","type":"education","lineage":["https://openalex.org/I176601375"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Mohammed Salah","raw_affiliation_strings":["Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates"],"raw_orcid":"https://orcid.org/0000-0003-1646-7919","affiliations":[{"raw_affiliation_string":"Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I176601375"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028846094","display_name":"Hasan Al-Marzouqi","orcid":"https://orcid.org/0000-0002-2826-1515"},"institutions":[{"id":"https://openalex.org/I176601375","display_name":"Khalifa University of Science and Technology","ror":"https://ror.org/05hffr360","country_code":"AE","type":"education","lineage":["https://openalex.org/I176601375"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Hasan Al Marzouqi","raw_affiliation_strings":["Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates"],"raw_orcid":"https://orcid.org/0000-0002-2826-1515","affiliations":[{"raw_affiliation_string":"Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I176601375"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075543445","display_name":"Andreas Henschel","orcid":"https://orcid.org/0000-0003-1386-5372"},"institutions":[{"id":"https://openalex.org/I176601375","display_name":"Khalifa University of Science and Technology","ror":"https://ror.org/05hffr360","country_code":"AE","type":"education","lineage":["https://openalex.org/I176601375"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Andreas Henschel","raw_affiliation_strings":["Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates"],"raw_orcid":"https://orcid.org/0000-0003-1386-5372","affiliations":[{"raw_affiliation_string":"Department of Computer Science, Khalifa University, Abu Dhabi, United Arab Emirates","institution_ids":["https://openalex.org/I176601375"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14626641,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"184059","last_page":"184070"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9412000179290771,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6672000288963318},{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.6420999765396118},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5748000144958496},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4943000078201294},{"id":"https://openalex.org/keywords/monetary-policy","display_name":"Monetary policy","score":0.41510000824928284},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.3481000065803528},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.336899995803833}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7311999797821045},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6672000288963318},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.6420999765396118},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5748000144958496},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4943000078201294},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4366999864578247},{"id":"https://openalex.org/C126285488","wikidata":"https://www.wikidata.org/wiki/Q178476","display_name":"Monetary policy","level":2,"score":0.41510000824928284},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39649999141693115},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C19244329","wikidata":"https://www.wikidata.org/wiki/Q208697","display_name":"Financial market","level":2,"score":0.32910001277923584},{"id":"https://openalex.org/C189722922","wikidata":"https://www.wikidata.org/wiki/Q667481","display_name":"Open market operation","level":3,"score":0.29120001196861267},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.2635999917984009},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.25859999656677246},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.2565999925136566},{"id":"https://openalex.org/C67277372","wikidata":"https://www.wikidata.org/wiki/Q7449085","display_name":"Semantic role labeling","level":3,"score":0.25}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3625120","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3625120","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:163469ef9277468daa3d9940c44b0728","is_oa":true,"landing_page_url":"https://doaj.org/article/163469ef9277468daa3d9940c44b0728","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 184059-184070 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3625120","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3625120","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322334","display_name":"Khalifa University of Science, Technology and Research","ror":"https://ror.org/05hffr360"},{"id":"https://openalex.org/F4320322924","display_name":"Changsha University of Science\u00a0and\u00a0Technology","ror":"https://ror.org/03yph8055"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Federal":[0],"Open":[1],"Market":[2],"Committee":[3],"(FOMC)":[4],"press":[5,42,99],"conferences":[6,43],"represent":[7],"critical":[8],"information":[9],"channels":[10],"through":[11],"which":[12],"monetary":[13],"policy":[14,35],"decisions":[15],"impact":[16],"financial":[17,75],"markets.":[18],"In":[19],"the":[20,157],"FOMC":[21,41],"context,":[22],"Question":[23],"Generation":[24],"(QG)":[25],"plays":[26],"an":[27],"important":[28],"role":[29],"in":[30],"probing":[31],"economic":[32],"outlooks":[33],"and":[34,56,81,110,121,137,153],"intentions.":[36],"Traditional":[37],"analysis":[38],"methods":[39],"of":[40,98,159],"focused":[44],"solely":[45],"on":[46],"textual":[47,80],"content,":[48],"while":[49],"visual":[50,82,160],"features":[51],"such":[52],"as":[53],"facial":[54],"expressions":[55],"gestures":[57],"encode":[58],"valuable,":[59],"complementary":[60],"signals.":[61],"To":[62,84],"address":[63],"this":[64,66,86,114],"limitation,":[65],"work":[67],"proposes":[68],"leveraging":[69],"Vision-Language":[70],"Models":[71],"(VLMs)":[72],"for":[73],"enhanced":[74],"QG":[76],"by":[77],"jointly":[78],"modeling":[79],"modalities.":[83],"support":[85],"approach,":[87],"we":[88],"introduce":[89],"FOMC-QA,":[90],"a":[91],"large-scale":[92],"multi-modal":[93],"dataset":[94],"comprising":[95],"40":[96],"hours":[97],"conference":[100],"video":[101],"segments":[102],"aligned":[103],"with":[104],"their":[105,127,146],"corresponding":[106],"transcripts,":[107],"context":[108],"paragraphs,":[109],"audience":[111],"questions.":[112],"Using":[113],"dataset,":[115],"state-of-the-art":[116],"(SOTA)":[117],"VLMs":[118,144],"(Sa2VA,":[119],"VideoGLaMM,":[120],"Video-ChatGPT)":[122],"are":[123],"rigorously":[124],"benchmarked":[125],"against":[126],"text-only":[128],"Large":[129],"Language":[130],"Model":[131],"(LLM)":[132],"counterparts":[133],"(Qwen2.5,":[134],"Phi-3":[135],"Mini,":[136],"Vicuna).":[138],"The":[139],"obtained":[140],"results":[141],"show":[142],"that":[143],"outperform":[145],"LLM-only":[147],"versions":[148],"across":[149],"both":[150],"semantic":[151],"similarity":[152],"question":[154],"relevance,":[155],"highlighting":[156],"benefit":[158],"grounding.":[161]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-28T00:00:00"}
