{"id":"https://openalex.org/W7140162297","doi":"https://doi.org/10.48550/arxiv.2603.21092","title":"Generative Artificial Intelligence Assisted Multi-modal Semantic Extraction for NOMA-based Image Transmissions","display_name":"Generative Artificial Intelligence Assisted Multi-modal Semantic Extraction for NOMA-based Image Transmissions","publication_year":2026,"publication_date":"2026-03-22","ids":{"openalex":"https://openalex.org/W7140162297","doi":"https://doi.org/10.48550/arxiv.2603.21092"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.21092","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21092","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.21092","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Zhao, Songhan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Songhan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Gong, Shimin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gong, Shimin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Gu, Bo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Bo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Du, Hongyang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Hongyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Mu, Xidong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mu, Xidong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xiong, Zehui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Zehui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Fang, Yuming","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Yuming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":0.7738999724388123,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11458","display_name":"Advanced Wireless Communication Technologies","score":0.7738999724388123,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12131","display_name":"Wireless Signal Modulation Classification","score":0.12470000237226486,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10964","display_name":"Wireless Communication Security Techniques","score":0.011699999682605267,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantic-feature","display_name":"Semantic feature","score":0.4830999970436096},{"id":"https://openalex.org/keywords/semantic-computing","display_name":"Semantic computing","score":0.47290000319480896},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4521999955177307},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.4490000009536743},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4291999936103821},{"id":"https://openalex.org/keywords/transmission","display_name":"Transmission (telecommunications)","score":0.4092999994754791},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.39149999618530273},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.37630000710487366}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8363999724388123},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5117999911308289},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.4830999970436096},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.47290000319480896},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4521999955177307},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4490000009536743},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4291999936103821},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.4092999994754791},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.39149999618530273},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.37630000710487366},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35929998755455017},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.33480000495910645},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.3147999942302704},{"id":"https://openalex.org/C202708506","wikidata":"https://www.wikidata.org/wiki/Q7449050","display_name":"Semantic compression","level":5,"score":0.31459999084472656},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.31299999356269836},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.310699999332428},{"id":"https://openalex.org/C103692084","wikidata":"https://www.wikidata.org/wiki/Q1765824","display_name":"Semantic grid","level":3,"score":0.28769999742507935},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.2858999967575073},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.28349998593330383},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.2815000116825104},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.21092","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21092","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.21092","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21092","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,131,143],"investigate":[4],"a":[5,40,85],"generative":[6],"artificial":[7],"intelligence":[8],"(GAI)-assisted":[9],"semantic":[10,25,51,69,77,92,99,104,125,148,178,188],"communication":[11],"framework":[12,199],"for":[13,35],"non-orthogonal":[14],"multiple":[15],"access":[16],"(NOMA)-based":[17],"image":[18,36,52],"transmissions.":[19],"Semantic":[20],"users":[21],"(SUs)":[22],"extract":[23],"cross-modal":[24],"features":[26,126,149],"from":[27],"the":[28,46,68,98,103,109,117,152,165,173,177,182,187,192,197,202,207],"raw":[29],"images,":[30],"which":[31],"are":[32,161],"then":[33],"used":[34,162],"recovery":[37,49,78,93,189],"by":[38,95],"leveraging":[39],"GAI":[41,44],"model.":[42],"The":[43],"enhances":[45],"generalization":[47],"and":[48,71,80,91,112,127,135,145,181,191],"of":[50,88,155,176],"transmissions,":[53],"while":[54,157],"NOMA":[55,113],"efficiently":[56],"allocates":[57],"transmission":[58,72,81,89,118,166,183,193],"capacities":[59],"to":[60,150,163,205,211],"SUs":[61],"based":[62],"on":[63],"their":[64],"traffic":[65],"demands.":[66],"Thus,":[67],"extraction":[70],"control":[73,167,184],"jointly":[74,96],"affect":[75],"both":[76],"performance":[79,87],"overhead.":[82],"We":[83],"maximize":[84],"weighted":[86],"latency":[90,194],"accuracy":[94,190],"optimizing":[97],"feature":[100,179],"selection":[101,180],"at":[102,116],"level,":[105],"as":[106,108],"well":[107],"receive":[110],"beamforming":[111],"decoding":[114],"order":[115],"level.":[119],"To":[120],"reduce":[121],"potential":[122],"redundancy":[123],"in":[124],"improve":[128,206],"optimization":[129,139,159],"efficiency,":[130],"develop":[132],"an":[133],"importance-aware":[134],"model-driven":[136],"proximal":[137],"policy":[138],"(IM-PPO)":[140],"framework.":[141],"Specifically,":[142],"quantify":[144],"retain":[146],"high-importance":[147],"enhance":[151],"learning":[153,208],"efficiency":[154,209],"PPO,":[156],"model-based":[158],"methods":[160],"adapt":[164],"variables.":[168],"Numerical":[169],"results":[170],"validate":[171],"that":[172],"joint":[174],"adjustment":[175],"significantly":[185],"improves":[186],"performance.":[195],"Moreover,":[196],"IM-PPO":[198],"effectively":[200],"leverages":[201],"model":[203],"information":[204],"compared":[210],"benchmark":[212],"methods.":[213]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-03-25T00:00:00"}
