{"id":"https://openalex.org/W4381094892","doi":"https://doi.org/10.1007/s00521-023-08744-1","title":"Improved Arabic image captioning model using feature concatenation with pre-trained word embedding","display_name":"Improved Arabic image captioning model using feature concatenation with pre-trained word embedding","publication_year":2023,"publication_date":"2023-06-17","ids":{"openalex":"https://openalex.org/W4381094892","doi":"https://doi.org/10.1007/s00521-023-08744-1"},"language":"en","primary_location":{"id":"doi:10.1007/s00521-023-08744-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-023-08744-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-023-08744-1.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00521-023-08744-1.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040420095","display_name":"Samar Elbedwehy","orcid":"https://orcid.org/0000-0002-2187-0174"},"institutions":[{"id":"https://openalex.org/I130309236","display_name":"Kafrelsheikh University","ror":"https://ror.org/04a97mm30","country_code":"EG","type":"education","lineage":["https://openalex.org/I130309236"]}],"countries":["EG"],"is_corresponding":true,"raw_author_name":"Samar Elbedwehy","raw_affiliation_strings":["Department of Data Science, Faculty of Artificial Intelligence, Kafrelsheikh University, Kafr El Sheikh, Egypt"],"raw_orcid":"https://orcid.org/0000-0002-2187-0174","affiliations":[{"raw_affiliation_string":"Department of Data Science, Faculty of Artificial Intelligence, Kafrelsheikh University, Kafr El Sheikh, Egypt","institution_ids":["https://openalex.org/I130309236"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022601935","display_name":"T. Medhat","orcid":null},"institutions":[{"id":"https://openalex.org/I130309236","display_name":"Kafrelsheikh University","ror":"https://ror.org/04a97mm30","country_code":"EG","type":"education","lineage":["https://openalex.org/I130309236"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"T. Medhat","raw_affiliation_strings":["Department of Electrical Engineering, Faculty of Engineering, Kafrelsheikh University, Kafr El Sheikh, Egypt"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Faculty of Engineering, Kafrelsheikh University, Kafr El Sheikh, Egypt","institution_ids":["https://openalex.org/I130309236"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5040420095"],"corresponding_institution_ids":["https://openalex.org/I130309236"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":1.2952,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.82276631,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"35","issue":"26","first_page":"19051","last_page":"19067"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8836265802383423},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8440254926681519},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6356309652328491},{"id":"https://openalex.org/keywords/concatenation","display_name":"Concatenation (mathematics)","score":0.5709463357925415},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5453673005104065},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5282909870147705},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.500551700592041},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4813295602798462},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4772453308105469},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.47432371973991394},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.46890226006507874},{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.4540482461452484},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.4453860819339752},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4313313066959381},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.34500226378440857},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09521499276161194},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07962203025817871}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8836265802383423},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8440254926681519},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6356309652328491},{"id":"https://openalex.org/C87619178","wikidata":"https://www.wikidata.org/wiki/Q126002","display_name":"Concatenation (mathematics)","level":2,"score":0.5709463357925415},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5453673005104065},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5282909870147705},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.500551700592041},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4813295602798462},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4772453308105469},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.47432371973991394},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.46890226006507874},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.4540482461452484},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.4453860819339752},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4313313066959381},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.34500226378440857},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09521499276161194},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07962203025817871},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00521-023-08744-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-023-08744-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-023-08744-1.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00521-023-08744-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-023-08744-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-023-08744-1.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8100000023841858,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321655","display_name":"Science and Technology Development Fund","ror":"https://ror.org/044vr6g03"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4381094892.pdf"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W1895577753","https://openalex.org/W1902237438","https://openalex.org/W2506483933","https://openalex.org/W2564590796","https://openalex.org/W2604380351","https://openalex.org/W2768477045","https://openalex.org/W2805368175","https://openalex.org/W2963163009","https://openalex.org/W2977433292","https://openalex.org/W2997942948","https://openalex.org/W3011608779","https://openalex.org/W3032651662","https://openalex.org/W3034655362","https://openalex.org/W3034682719","https://openalex.org/W3094673569","https://openalex.org/W3103896273","https://openalex.org/W3113708896","https://openalex.org/W3138298063","https://openalex.org/W3138516171","https://openalex.org/W3154362247","https://openalex.org/W3176169354","https://openalex.org/W3211729376","https://openalex.org/W4312443924","https://openalex.org/W4312937018","https://openalex.org/W6600433979","https://openalex.org/W6600561556","https://openalex.org/W6601955380","https://openalex.org/W6833105446"],"related_works":["https://openalex.org/W2547835662","https://openalex.org/W2546942002","https://openalex.org/W4312545247","https://openalex.org/W4384210086","https://openalex.org/W2945836425","https://openalex.org/W3092611869","https://openalex.org/W3196747313","https://openalex.org/W3193004783","https://openalex.org/W3186858063","https://openalex.org/W3185606300"],"abstract_inverted_index":{"Abstract":[0],"Automatic":[1],"captioning":[2,25,34,63,185],"of":[3,9,17,41,100,141,191,224,242,254],"images":[4,79],"contributes":[5],"to":[6,131,166],"identifying":[7],"features":[8],"multimedia":[10],"content":[11],"and":[12,21,72,84,98,105,127,144,164,200,228,256],"helps":[13],"in":[14,68,80,90],"the":[15,39,70,81,91,112,135,142,146,170,192,209,215,219,234,250],"detection":[16],"interesting":[18],"patterns,":[19],"trends,":[20],"occurrences.":[22],"English":[23],"image":[24,33,62,113,184,204],"has":[26],"recently":[27],"made":[28],"incredible":[29],"progress;":[30],"however,":[31],"Arabic":[32,44,61,108,183],"is":[35,47,152],"still":[36],"lagging.":[37],"In":[38],"field":[40],"machine":[42],"learning,":[43],"image-caption":[45],"generation":[46,148],"generally":[48],"a":[49,56,85,189,240],"very":[50],"difficult":[51],"problem.":[52],"This":[53],"paper":[54],"presents":[55],"more":[57],"accurate":[58,172],"model":[59,89,213,238],"for":[60,145],"by":[64,154],"using":[65,119],"transformer":[66],"models":[67,95,124,195],"both":[69],"encoder":[71,82],"decoder":[73,92],"phases":[74],"as":[75,202],"feature":[76,114,139,205],"extractors":[77],"from":[78,168],"phase":[83],"pre-trained":[86,157,173],"word":[87],"embedding":[88,159,175,212,237],"phase.":[93],"The":[94],"are":[96,102,247],"demonstrated,":[97],"all":[99],"them":[101,134,169],"implemented,":[103],"trained,":[104],"tested":[106,153],"on":[107],"Flickr8k":[109],"datasets.":[110],"For":[111],"extraction":[115],"subsystem,":[116,150],"we":[117],"compared":[118],"three":[120,193],"different":[121,156],"individual":[122],"vision":[123],"(SWIN,":[125],"XCIT,":[126],"ConvNexT)":[128],"with":[129,198,208,226,229,232,244],"concatenation":[130,190],"get":[132],"among":[133,218],"most":[136,171],"expressive":[137],"extracted":[138],"vector":[140],"image,":[143],"caption":[147],"lingual":[149],"which":[151,246],"four":[155],"language":[158,174,211,236],"models:":[160],"(ARABERT,":[161],"ARAELECTRA,":[162],"MARBERTv2,":[163],"CamelBERT),":[165],"select":[167],"model.":[176],"Our":[177],"experiments":[178],"showed":[179],"that":[180,187],"building":[181],"an":[182,203],"system":[186],"uses":[188],"transformer-based":[194],"ConvNexT":[196,230],"combined":[197,207,231],"SWIN":[199,233],"XCIT":[201],"extractor,":[206],"CamelBERT":[210],"produces":[214],"best":[216],"results":[217],"other":[220],"combinations,":[221],"having":[222,239],"scores":[223],"0.5980":[225],"BLEU-1":[227],"araelectra":[235],"score":[241],"0.1664":[243],"BLEU-4":[245],"higher":[248],"than":[249],"previously":[251],"reported":[252],"values":[253],"0.443":[255],"0.157.":[257]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2}],"updated_date":"2026-01-20T17:24:06.736184","created_date":"2025-10-10T00:00:00"}
