{"id":"https://openalex.org/W4413157648","doi":"https://doi.org/10.1109/access.2025.3598598","title":"An Image Semantic Representation Method Based on Cross-Modal Adaptive Multi-Layer Perceptron","display_name":"An Image Semantic Representation Method Based on Cross-Modal Adaptive Multi-Layer Perceptron","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4413157648","doi":"https://doi.org/10.1109/access.2025.3598598"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3598598","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3598598","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3598598","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yang Liu","orcid":"https://orcid.org/0009-0006-4017-260X"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Liu","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"raw_orcid":"https://orcid.org/0009-0006-4017-260X","affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002399867","display_name":"Xiulei Liu","orcid":"https://orcid.org/0000-0002-9303-3682"},"institutions":[{"id":"https://openalex.org/I78675632","display_name":"Beijing Information Science & Technology University","ror":"https://ror.org/04xnqep60","country_code":"CN","type":"education","lineage":["https://openalex.org/I78675632"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiulei Liu","raw_affiliation_strings":["Computer School, Beijing Information Science and Technology University, Beijing, China","Beijing Information Science and Technology University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9303-3682","affiliations":[{"raw_affiliation_string":"Computer School, Beijing Information Science and Technology University, Beijing, China","institution_ids":["https://openalex.org/I78675632"]},{"raw_affiliation_string":"Beijing Information Science and Technology University, Beijing, China","institution_ids":["https://openalex.org/I78675632"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005693926","display_name":"Chengli Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengli Peng","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"raw_orcid":"https://orcid.org/0009-0008-4867-1758","affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I139660479"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17431695,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"143351","last_page":"143359"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.8776999711990356,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.8776999711990356,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7612431049346924},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.6517423987388611},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5940017104148865},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5807605385780334},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5435400605201721},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4819366931915283},{"id":"https://openalex.org/keywords/perceptron","display_name":"Perceptron","score":0.45938804745674133},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.4363245964050293},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3926674723625183},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.21633151173591614},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.08153665065765381}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7612431049346924},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6517423987388611},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5940017104148865},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5807605385780334},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5435400605201721},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4819366931915283},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.45938804745674133},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.4363245964050293},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3926674723625183},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.21633151173591614},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.08153665065765381},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3598598","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3598598","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:311db0064cfe4000b748a65705bac1e2","is_oa":true,"landing_page_url":"https://doaj.org/article/311db0064cfe4000b748a65705bac1e2","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 143351-143359 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3598598","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3598598","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321514","display_name":"Central South University","ror":"https://ror.org/00f1zfq44"},{"id":"https://openalex.org/F4320326666","display_name":"Beijing Information Science and Technology University","ror":"https://ror.org/04xnqep60"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1861492603","https://openalex.org/W1905882502","https://openalex.org/W1956340063","https://openalex.org/W2101105183","https://openalex.org/W2302086703","https://openalex.org/W2506483933","https://openalex.org/W2564898401","https://openalex.org/W2745461083","https://openalex.org/W2890531016","https://openalex.org/W2963084599","https://openalex.org/W2963101956","https://openalex.org/W2963686907","https://openalex.org/W2986670728","https://openalex.org/W3034655362","https://openalex.org/W3035284526","https://openalex.org/W3091588028","https://openalex.org/W3133524129","https://openalex.org/W3152685972","https://openalex.org/W3167939936","https://openalex.org/W3173220247","https://openalex.org/W3174377922","https://openalex.org/W4312712450","https://openalex.org/W4312914652","https://openalex.org/W4312922092","https://openalex.org/W4312924260","https://openalex.org/W4372337842","https://openalex.org/W4382460199","https://openalex.org/W4385245566","https://openalex.org/W4387968461","https://openalex.org/W4405440281","https://openalex.org/W4407304007","https://openalex.org/W6631190155","https://openalex.org/W6678262379","https://openalex.org/W6682631176","https://openalex.org/W6763643401","https://openalex.org/W6789705400","https://openalex.org/W6791353385","https://openalex.org/W6811013733","https://openalex.org/W6853754985"],"related_works":["https://openalex.org/W2082756648","https://openalex.org/W3194278305","https://openalex.org/W2289648981","https://openalex.org/W1565459987","https://openalex.org/W2062195135","https://openalex.org/W2379392295","https://openalex.org/W3160965418","https://openalex.org/W45198419","https://openalex.org/W2001427828","https://openalex.org/W4281697769"],"abstract_inverted_index":{"With":[0],"the":[1,7,76,142,148,156,172,181,191,209,221,226,254,262],"development":[2],"of":[3,54,94,106,147,183,193,228,251,256,261],"Multimodal":[4],"information":[5],"research,":[6],"latest":[8],"image":[9,31],"captioning":[10],"aims":[11],"to":[12,61,63,82,135,180,198,239],"generate":[13],"variable-length":[14,65,185],"sentences":[15,66,186],"following":[16],"cross-modal":[17,68,95,188,204],"signals":[18],"(e.g.,":[19],"visual":[20,158],"and":[21,36,90,113,123,144,159,230,234],"text).":[22],"While":[23],"Transformer-based":[24,216],"methods":[25,217],"have":[26],"shown":[27,42],"impressive":[28],"progress":[29],"for":[30,47,59,168],"captioning,":[32],"they":[33],"are":[34,126,162],"complex":[35],"computationally":[37],"expensive.":[38],"Recent":[39],"work":[40],"has":[41],"Multi-layer":[43],"Perceptron\u2019s":[44],"(MLP)":[45],"potential":[46],"lower":[48],"computational":[49,99,145],"cost.":[50],"However,":[51],"fixed-parameter":[52],"weights":[53],"MLP":[55,84,111,133,153],"make":[56],"it":[57],"difficult":[58],"models":[60,242],"adapt":[62,179],"producing":[64],"in":[67,187,203],"scenarios.":[69],"To":[70],"address":[71],"these":[72],"challenges,":[73],"we":[74],"propose":[75],"novel":[77],"Cross-Modal":[78],"Adaptive":[79],"Network":[80],"(CMANet)":[81],"improve":[83],"by":[85,129,218,232],"dynamic":[86,165],"parameter":[87],"weight":[88,166],"settings":[89],"bidirectional":[91,116,174],"semantic":[92],"alignment":[93],"features,":[96],"while":[97,224,253],"enhancing":[98],"efficiency.":[100],"Specifically,":[101],"a":[102,114,151,248],"network":[103],"architecture":[104],"consisting":[105],"two":[107,130],"independent":[108,131],"fixed-weight":[109],"two-layer":[110,132],"modules":[112,134],"dynamic-weight":[115,173],"linear":[117,175],"layer":[118],"module":[119],"was":[120],"designed.":[121],"Visual":[122],"textual":[124,160],"features":[125,161],"first":[127],"processed":[128,157],"extract":[136],"their":[137],"intrinsic":[138],"properties,":[139],"thereby":[140],"improving":[141],"training":[143],"efficiency":[146],"model":[149],"through":[150],"simple":[152],"structure.":[154],"Subsequently,":[155],"used":[163],"as":[164,244],"matrices":[167],"each":[169],"other.":[170],"Through":[171],"layer,":[176],"CMANet":[177,214,246],"can":[178],"requirement":[182],"generating":[184],"scenarios,":[189],"addressing":[190],"issue":[192],"traditional":[194],"MLPs":[195],"being":[196],"unable":[197],"handle":[199],"variable":[200],"text":[201],"lengths":[202],"feature":[205],"relationships.":[206],"Results":[207],"on":[208],"MS-COCO":[210],"dataset":[211],"show":[212],"that":[213],"outperforms":[215],"2.7%":[219],"across":[220],"CIDEr":[222],"score,":[223],"reducing":[225],"number":[227,255],"parameters":[229,257],"GFLOPs":[231],"42.9%":[233],"69.9%,":[235],"respectively.":[236],"In":[237],"comparison":[238],"large-scale":[240],"pre-trained":[241],"such":[243],"LEMON,":[245],"achieves":[247],"performance":[249],"improvement":[250],"1.3%,":[252],"is":[258],"only":[259],"3%":[260],"LEMON.":[263]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
