{"id":"https://openalex.org/W4415325527","doi":"https://doi.org/10.1007/978-981-95-3459-3_38","title":"Image Captioning via\u00a0Masked Conditional Diffusion","display_name":"Image Captioning via\u00a0Masked Conditional Diffusion","publication_year":2025,"publication_date":"2025-10-18","ids":{"openalex":"https://openalex.org/W4415325527","doi":"https://doi.org/10.1007/978-981-95-3459-3_38"},"language":"en","primary_location":{"id":"doi:10.1007/978-981-95-3459-3_38","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-981-95-3459-3_38","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jiayi Zhou","orcid":"https://orcid.org/0009-0004-5369-6627"},"institutions":[{"id":"https://openalex.org/I141568987","display_name":"Hong Kong Baptist University","ror":"https://ror.org/0145fw131","country_code":"HK","type":"education","lineage":["https://openalex.org/I141568987"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Jiayi Zhou","raw_affiliation_strings":["Hong Kong Baptist University, Hong Kong SAR, China"],"raw_orcid":"https://orcid.org/0009-0004-5369-6627","affiliations":[{"raw_affiliation_string":"Hong Kong Baptist University, Hong Kong SAR, China","institution_ids":["https://openalex.org/I141568987"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100369885","display_name":"Chen Li","orcid":"https://orcid.org/0000-0002-8784-8148"},"institutions":[{"id":"https://openalex.org/I14314212","display_name":"Osaka University of Economics","ror":"https://ror.org/04g11bp59","country_code":"JP","type":"education","lineage":["https://openalex.org/I14314212"]},{"id":"https://openalex.org/I4210111835","display_name":"Osaka Health Science University","ror":"https://ror.org/01tvqd679","country_code":"JP","type":"education","lineage":["https://openalex.org/I4210111835"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Chen Li","raw_affiliation_strings":["D3 Center, The University of Osaka, Osaka, Japan"],"raw_orcid":"https://orcid.org/0000-0002-8784-8148","affiliations":[{"raw_affiliation_string":"D3 Center, The University of Osaka, Osaka, Japan","institution_ids":["https://openalex.org/I14314212","https://openalex.org/I4210111835"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084952571","display_name":"Huidong Tang","orcid":"https://orcid.org/0000-0002-5141-2457"},"institutions":[{"id":"https://openalex.org/I4210154121","display_name":"Shandong Institute of Commerce & Technology","ror":"https://ror.org/03xk2yz39","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210154121"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huidong Tang","raw_affiliation_strings":["Shandong Institute of Commerce and Technology, Jinan, China"],"raw_orcid":"https://orcid.org/0000-0002-5141-2457","affiliations":[{"raw_affiliation_string":"Shandong Institute of Commerce and Technology, Jinan, China","institution_ids":["https://openalex.org/I4210154121"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071032734","display_name":"Sayaka Kamei","orcid":"https://orcid.org/0000-0003-1716-3028"},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]},{"id":"https://openalex.org/I4210126469","display_name":"Higashihiroshima Medical Center","ror":"https://ror.org/03bd22t26","country_code":"JP","type":"healthcare","lineage":["https://openalex.org/I4210126469","https://openalex.org/I4210137409"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Sayaka Kamei","raw_affiliation_strings":["Hiroshima University, Higashihiroshima, Japan"],"raw_orcid":"https://orcid.org/0000-0003-1716-3028","affiliations":[{"raw_affiliation_string":"Hiroshima University, Higashihiroshima, Japan","institution_ids":["https://openalex.org/I4210126469","https://openalex.org/I113306721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101847022","display_name":"Shuai Jiang","orcid":"https://orcid.org/0000-0002-3046-8689"},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]},{"id":"https://openalex.org/I4210126469","display_name":"Higashihiroshima Medical Center","ror":"https://ror.org/03bd22t26","country_code":"JP","type":"healthcare","lineage":["https://openalex.org/I4210126469","https://openalex.org/I4210137409"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shuai Jiang","raw_affiliation_strings":["Hiroshima University, Higashihiroshima, Japan"],"raw_orcid":"https://orcid.org/0000-0002-3046-8689","affiliations":[{"raw_affiliation_string":"Hiroshima University, Higashihiroshima, Japan","institution_ids":["https://openalex.org/I4210126469","https://openalex.org/I113306721"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078425375","display_name":"Yasuhiko Morimoto","orcid":"https://orcid.org/0000-0001-7130-2864"},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]},{"id":"https://openalex.org/I4210126469","display_name":"Higashihiroshima Medical Center","ror":"https://ror.org/03bd22t26","country_code":"JP","type":"healthcare","lineage":["https://openalex.org/I4210126469","https://openalex.org/I4210137409"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yasuhiko Morimoto","raw_affiliation_strings":["Hiroshima University, Higashihiroshima, Japan"],"raw_orcid":"https://orcid.org/0000-0001-7130-2864","affiliations":[{"raw_affiliation_string":"Hiroshima University, Higashihiroshima, Japan","institution_ids":["https://openalex.org/I4210126469","https://openalex.org/I113306721"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I141568987"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.62403101,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"482","last_page":"495"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8238999843597412},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5845999717712402},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.5634999871253967},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.557200014591217},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.557200014591217},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.49059998989105225},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.42820000648498535},{"id":"https://openalex.org/keywords/image-denoising","display_name":"Image denoising","score":0.3869999945163727}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8238999843597412},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8090999722480774},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.65420001745224},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5845999717712402},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.5634999871253967},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.557200014591217},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.557200014591217},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.49059998989105225},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.42820000648498535},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39559999108314514},{"id":"https://openalex.org/C2983327147","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Image denoising","level":3,"score":0.3869999945163727},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.34470000863075256},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.34139999747276306},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3253999948501587},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3208000063896179},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.31940001249313354},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.31690001487731934},{"id":"https://openalex.org/C203504353","wikidata":"https://www.wikidata.org/wiki/Q4765461","display_name":"Anisotropic diffusion","level":3,"score":0.3158999979496002},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.27639999985694885}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-981-95-3459-3_38","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-981-95-3459-3_38","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1895577753","https://openalex.org/W1947481528","https://openalex.org/W1956340063","https://openalex.org/W2101105183","https://openalex.org/W2255466643","https://openalex.org/W2506483933","https://openalex.org/W2745461083","https://openalex.org/W2963992143","https://openalex.org/W2986670728","https://openalex.org/W3034655362","https://openalex.org/W3093394956","https://openalex.org/W3153469116","https://openalex.org/W3167939936","https://openalex.org/W3180355996","https://openalex.org/W3205981128","https://openalex.org/W4312388283","https://openalex.org/W4312933868","https://openalex.org/W4375868765","https://openalex.org/W4386072307","https://openalex.org/W4402754015"],"related_works":[],"abstract_inverted_index":null,"counts_by_year":[],"updated_date":"2026-06-13T06:13:01.061226","created_date":"2025-10-19T00:00:00"}
