{"id":"https://openalex.org/W4387619800","doi":"https://doi.org/10.15439/2023f4192","title":"Multimodal Neural Networks in the Problem of Captioning Images in Newspapers","display_name":"Multimodal Neural Networks in the Problem of Captioning Images in Newspapers","publication_year":2023,"publication_date":"2023-09-26","ids":{"openalex":"https://openalex.org/W4387619800","doi":"https://doi.org/10.15439/2023f4192"},"language":"en","primary_location":{"id":"doi:10.15439/2023f4192","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f4192","pdf_url":"https://annals-csis.org/proceedings/2023/drp/pdf/4192.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://annals-csis.org/proceedings/2023/drp/pdf/4192.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045060547","display_name":"Patryk Kaszuba","orcid":null},"institutions":[{"id":"https://openalex.org/I59411706","display_name":"Adam Mickiewicz University in Pozna\u0144","ror":"https://ror.org/04g6bbq64","country_code":"PL","type":"education","lineage":["https://openalex.org/I59411706"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Patryk Kaszuba","raw_affiliation_strings":["Faculty of Mathematics and Computer Science Adam Mickiewicz University Pozna , Poland","Faculty of Mathematics and Computer Science Adam Mickiewicz University Pozna, Poland","Faculty of Mathematics and Computer Science Adam Mickiewicz University Pozna\u0144, Poland"],"affiliations":[{"raw_affiliation_string":"Faculty of Mathematics and Computer Science Adam Mickiewicz University Pozna , Poland","institution_ids":["https://openalex.org/I59411706"]},{"raw_affiliation_string":"Faculty of Mathematics and Computer Science Adam Mickiewicz University Pozna, Poland","institution_ids":["https://openalex.org/I59411706"]},{"raw_affiliation_string":"Faculty of Mathematics and Computer Science Adam Mickiewicz University Pozna\u0144, Poland","institution_ids":["https://openalex.org/I59411706"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5045060547"],"corresponding_institution_ids":["https://openalex.org/I59411706"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14345638,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"35","issue":null,"first_page":"1337","last_page":"1340"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9269000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9269000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9016000032424927,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.9529314637184143},{"id":"https://openalex.org/keywords/newspaper","display_name":"Newspaper","score":0.7833907604217529},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7528529763221741},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5769421458244324},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4663863182067871},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3858751356601715},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33355921506881714},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.33079373836517334},{"id":"https://openalex.org/keywords/advertising","display_name":"Advertising","score":0.11769276857376099},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.06503358483314514}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.9529314637184143},{"id":"https://openalex.org/C201280247","wikidata":"https://www.wikidata.org/wiki/Q11032","display_name":"Newspaper","level":2,"score":0.7833907604217529},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7528529763221741},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5769421458244324},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4663863182067871},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3858751356601715},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33355921506881714},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.33079373836517334},{"id":"https://openalex.org/C112698675","wikidata":"https://www.wikidata.org/wiki/Q37038","display_name":"Advertising","level":1,"score":0.11769276857376099},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.06503358483314514}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.15439/2023f4192","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f4192","pdf_url":"https://annals-csis.org/proceedings/2023/drp/pdf/4192.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:doaj.org/article:079bd967400e4cf5bfef06ca11e75211","is_oa":true,"landing_page_url":"https://doaj.org/article/079bd967400e4cf5bfef06ca11e75211","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Annals of computer science and information systems, Vol 35, Pp 1337-1340 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.15439/2023f4192","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f4192","pdf_url":"https://annals-csis.org/proceedings/2023/drp/pdf/4192.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.4099999964237213}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387619800.pdf","grobid_xml":"https://content.openalex.org/works/W4387619800.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W1895577753","https://openalex.org/W1897761818","https://openalex.org/W1905882502","https://openalex.org/W2109586012","https://openalex.org/W2729842244","https://openalex.org/W2913090763","https://openalex.org/W2974212192","https://openalex.org/W2995435108","https://openalex.org/W3016923549","https://openalex.org/W3038476992","https://openalex.org/W3090449556","https://openalex.org/W3091588028","https://openalex.org/W3103455452","https://openalex.org/W3126337491","https://openalex.org/W3135367836","https://openalex.org/W3166396011","https://openalex.org/W3177525997","https://openalex.org/W4281758439","https://openalex.org/W4287855079","https://openalex.org/W4306820534","https://openalex.org/W4361194507","https://openalex.org/W4386065512","https://openalex.org/W4386076084","https://openalex.org/W6603806335","https://openalex.org/W6639657675","https://openalex.org/W6755136841","https://openalex.org/W6847386724","https://openalex.org/W6928992657"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2949362007","https://openalex.org/W3164229987","https://openalex.org/W3215212336","https://openalex.org/W4290852288","https://openalex.org/W3122720459","https://openalex.org/W4298897568","https://openalex.org/W1938708284","https://openalex.org/W4380190185","https://openalex.org/W4387608643"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"the":[3,23,34,63,74],"effectiveness":[4],"of":[5,33,57,66,76],"different":[6],"multimodal":[7,79],"neural":[8],"networks":[9],"in":[10],"captioning":[11,68],"newspaper":[12],"scan":[13],"images.These":[14],"methods":[15,80],"were":[16],"evaluated":[17],"on":[18],"a":[19,31,42,46,50,54],"dataset":[20],"created":[21],"for":[22,45,81],"Temporal":[24],"Image":[25],"Caption":[26],"Retrieval":[27],"Competition,":[28],"which":[29],"is":[30],"part":[32],"FedCSIS":[35],"2023":[36],"conference.The":[37],"task":[38],"was":[39],"to":[40],"predict":[41],"relevant":[43],"caption":[44],"picture":[47],"taken":[48],"from":[49,53],"newspaper,":[51],"chosen":[52],"given":[55],"list":[56],"captions.The":[58],"results":[59],"we":[60],"obtained":[61],"show":[62],"promising":[64],"potential":[65],"image":[67],"using":[69],"CLIP":[70],"architectures":[71],"and":[72],"emphasize":[73],"importance":[75],"developing":[77],"new":[78],"problems":[82],"that":[83],"combine":[84],"multiple":[85],"disciplines,":[86],"such":[87],"as":[88],"computer":[89],"vision":[90],"with":[91],"natural":[92],"language":[93],"processing.":[94]},"counts_by_year":[],"updated_date":"2026-03-07T13:37:22.277990","created_date":"2025-10-10T00:00:00"}
