{"id":"https://openalex.org/W4313422350","doi":"https://doi.org/10.1007/s00530-022-01036-z","title":"Layer-wise enhanced transformer with multi-modal fusion for image caption","display_name":"Layer-wise enhanced transformer with multi-modal fusion for image caption","publication_year":2022,"publication_date":"2022-12-19","ids":{"openalex":"https://openalex.org/W4313422350","doi":"https://doi.org/10.1007/s00530-022-01036-z"},"language":"en","primary_location":{"id":"doi:10.1007/s00530-022-01036-z","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s00530-022-01036-z","pdf_url":null,"source":{"id":"https://openalex.org/S112262039","display_name":"Multimedia Systems","issn_l":"0942-4962","issn":["0942-4962","1432-1882"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimedia Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027705753","display_name":"Jingdan Li","orcid":null},"institutions":[{"id":"https://openalex.org/I136765683","display_name":"Tianjin University of Technology","ror":"https://ror.org/00zbe0w13","country_code":"CN","type":"education","lineage":["https://openalex.org/I136765683"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingdan Li","raw_affiliation_strings":["Key Laboratory of Computer Vision and System (Ministry of Education), Tianjin University of Technology, Tianjin, 300384, China","Tianjin Key Laboratory of Intelligence Computing and Novel Software Technology, Tianjin University of Technology, Tianjin, 300384, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Computer Vision and System (Ministry of Education), Tianjin University of Technology, Tianjin, 300384, China","institution_ids":["https://openalex.org/I136765683"]},{"raw_affiliation_string":"Tianjin Key Laboratory of Intelligence Computing and Novel Software Technology, Tianjin University of Technology, Tianjin, 300384, China","institution_ids":["https://openalex.org/I136765683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100784213","display_name":"Yi Wang","orcid":"https://orcid.org/0000-0001-8659-4724"},"institutions":[{"id":"https://openalex.org/I136765683","display_name":"Tianjin University of Technology","ror":"https://ror.org/00zbe0w13","country_code":"CN","type":"education","lineage":["https://openalex.org/I136765683"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Wang","raw_affiliation_strings":["Key Laboratory of Computer Vision and System (Ministry of Education), Tianjin University of Technology, Tianjin, 300384, China","Tianjin Key Laboratory of Intelligence Computing and Novel Software Technology, Tianjin University of Technology, Tianjin, 300384, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Computer Vision and System (Ministry of Education), Tianjin University of Technology, Tianjin, 300384, China","institution_ids":["https://openalex.org/I136765683"]},{"raw_affiliation_string":"Tianjin Key Laboratory of Intelligence Computing and Novel Software Technology, Tianjin University of Technology, Tianjin, 300384, China","institution_ids":["https://openalex.org/I136765683"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005975642","display_name":"Dexin Zhao","orcid":"https://orcid.org/0009-0001-0009-9595"},"institutions":[{"id":"https://openalex.org/I136765683","display_name":"Tianjin University of Technology","ror":"https://ror.org/00zbe0w13","country_code":"CN","type":"education","lineage":["https://openalex.org/I136765683"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dexin Zhao","raw_affiliation_strings":["Key Laboratory of Computer Vision and System (Ministry of Education), Tianjin University of Technology, Tianjin, 300384, China","Tianjin Key Laboratory of Intelligence Computing and Novel Software Technology, Tianjin University of Technology, Tianjin, 300384, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Computer Vision and System (Ministry of Education), Tianjin University of Technology, Tianjin, 300384, China","institution_ids":["https://openalex.org/I136765683"]},{"raw_affiliation_string":"Tianjin Key Laboratory of Intelligence Computing and Novel Software Technology, Tianjin University of Technology, Tianjin, 300384, China","institution_ids":["https://openalex.org/I136765683"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5027705753"],"corresponding_institution_ids":["https://openalex.org/I136765683"],"apc_list":null,"apc_paid":null,"fwci":1.2232,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.80792638,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"29","issue":"3","first_page":"1043","last_page":"1056"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.838150680065155},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5952120423316956},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5648820400238037},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4682753086090088},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.458976686000824},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.44745275378227234},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.4314190149307251},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.22405710816383362}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.838150680065155},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5952120423316956},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5648820400238037},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4682753086090088},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.458976686000824},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.44745275378227234},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.4314190149307251},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.22405710816383362},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00530-022-01036-z","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s00530-022-01036-z","pdf_url":null,"source":{"id":"https://openalex.org/S112262039","display_name":"Multimedia Systems","issn_l":"0942-4962","issn":["0942-4962","1432-1882"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimedia Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7300000190734863}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1931639407","https://openalex.org/W1956340063","https://openalex.org/W2064675550","https://openalex.org/W2101105183","https://openalex.org/W2133512280","https://openalex.org/W2194775991","https://openalex.org/W2253806798","https://openalex.org/W2302086703","https://openalex.org/W2481240925","https://openalex.org/W2506483933","https://openalex.org/W2575842049","https://openalex.org/W2745461083","https://openalex.org/W2800782462","https://openalex.org/W2885013662","https://openalex.org/W2890531016","https://openalex.org/W2904551248","https://openalex.org/W2963084599","https://openalex.org/W2963101956","https://openalex.org/W2963595025","https://openalex.org/W2968660381","https://openalex.org/W2981165461","https://openalex.org/W2986670728","https://openalex.org/W2990818246","https://openalex.org/W3034316193","https://openalex.org/W3034655362","https://openalex.org/W3035497460","https://openalex.org/W3167939936","https://openalex.org/W3174377922","https://openalex.org/W3175824375","https://openalex.org/W4200094402","https://openalex.org/W4205357838","https://openalex.org/W4312263373","https://openalex.org/W6600042794","https://openalex.org/W6600339457","https://openalex.org/W6601939488"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2949362007","https://openalex.org/W2775506363","https://openalex.org/W4310447809","https://openalex.org/W4200243030","https://openalex.org/W2800782462","https://openalex.org/W4323777661","https://openalex.org/W3209117276","https://openalex.org/W4388184981","https://openalex.org/W2221419418"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
