{"id":"https://openalex.org/W4404037698","doi":"https://doi.org/10.1109/mlsp58920.2024.10734744","title":"Multimodal Generative Semantic Communication Based on Latent Diffusion Model","display_name":"Multimodal Generative Semantic Communication Based on Latent Diffusion Model","publication_year":2024,"publication_date":"2024-09-22","ids":{"openalex":"https://openalex.org/W4404037698","doi":"https://doi.org/10.1109/mlsp58920.2024.10734744"},"language":"en","primary_location":{"id":"doi:10.1109/mlsp58920.2024.10734744","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp58920.2024.10734744","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 34th International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080080275","display_name":"Weiqi Fu","orcid":"https://orcid.org/0000-0002-7368-383X"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiqi Fu","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052560055","display_name":"Lianming Xu","orcid":"https://orcid.org/0009-0006-9142-8863"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lianming Xu","raw_affiliation_strings":["Beijing University of Posts and Telecommunications,School of Electronic Engineering,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,School of Electronic Engineering,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100761149","display_name":"Xin Wu","orcid":"https://orcid.org/0000-0002-1733-3560"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Wu","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103884765","display_name":"Haoyang Wei","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyang Wei","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5115695478","display_name":"Li Wang","orcid":"https://orcid.org/0000-0002-0496-9500"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Wang","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.2219,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.83421903,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.7849000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.7849000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.7163000106811523,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.6653000116348267,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7501826286315918},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.7108221650123596},{"id":"https://openalex.org/keywords/probabilistic-latent-semantic-analysis","display_name":"Probabilistic latent semantic analysis","score":0.6620131731033325},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.6245509386062622},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4882345497608185},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4874532222747803},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.48128455877304077},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.24314367771148682}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7501826286315918},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.7108221650123596},{"id":"https://openalex.org/C112933361","wikidata":"https://www.wikidata.org/wiki/Q2845258","display_name":"Probabilistic latent semantic analysis","level":2,"score":0.6620131731033325},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.6245509386062622},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4882345497608185},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4874532222747803},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.48128455877304077},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.24314367771148682}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mlsp58920.2024.10734744","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp58920.2024.10734744","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 34th International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W2774839435","https://openalex.org/W2946889564","https://openalex.org/W2962785568","https://openalex.org/W3036851434","https://openalex.org/W3047615889","https://openalex.org/W3166791908","https://openalex.org/W4206175303","https://openalex.org/W4226115138","https://openalex.org/W4312933868","https://openalex.org/W4381785967","https://openalex.org/W4391677749","https://openalex.org/W6765779288","https://openalex.org/W6779823529","https://openalex.org/W6853140940"],"related_works":["https://openalex.org/W1551384396","https://openalex.org/W2251863249","https://openalex.org/W2096865229","https://openalex.org/W2353826422","https://openalex.org/W2921491680","https://openalex.org/W2612095515","https://openalex.org/W3033561275","https://openalex.org/W2894783287","https://openalex.org/W2110027950","https://openalex.org/W4291700620"],"abstract_inverted_index":{"In":[0],"emergencies,":[1],"the":[2,93,96,100,106,126,140,157],"ability":[3],"to":[4,15,34,87,120,131,153],"quickly":[5],"and":[6,11,14,37,64,74,83,164,175],"accurately":[7],"gather":[8],"environmental":[9],"data":[10,89,124],"command":[12],"information,":[13],"make":[16],"timely":[17],"decisions,":[18],"is":[19,118],"particularly":[20],"critical.":[21],"Traditional":[22],"semantic":[23,53,71,107,161],"communication":[24,54,162],"frameworks,":[25],"primarily":[26],"based":[27,104,114],"on":[28,105,115],"a":[29,50,78,110,148],"single":[30],"modality,":[31],"are":[32],"susceptible":[33],"complex":[35],"environments":[36],"lighting":[38],"conditions,":[39],"thereby":[40],"limiting":[41],"decision":[42],"accuracy.":[43],"To":[44],"this":[45,47],"end,":[46,95],"paper":[48],"introduces":[49],"multimodal":[51,102],"generative":[52],"framework":[55,59,97],"named":[56],"mm-GESCO.":[57],"The":[58],"ingests":[60],"streams":[61],"of":[62,80,135,151,159],"visible":[63],"infrared":[65],"modal":[66,123],"image":[67],"data,":[68],"generates":[69],"fused":[70],"segmentation":[72],"maps,":[73],"transmits":[75],"them":[76],"using":[77],"combination":[79],"one-hot":[81],"encoding":[82],"zlib":[84],"compression":[85,149],"techniques":[86],"enhance":[88],"transmission":[90],"efficiency.":[91],"At":[92],"receiving":[94],"can":[98],"reconstruct":[99,132],"original":[101],"images":[103],"maps.":[108],"Additionally,":[109],"latent":[111,127,133],"diffusion":[112],"model":[113],"contrastive":[116],"learning":[117],"designed":[119],"align":[121],"different":[122],"within":[125],"space,":[128],"allowing":[129],"mm-GESCO":[130,146],"features":[134],"any":[136],"modality":[137],"presented":[138],"at":[139],"input.":[141],"Experimental":[142],"results":[143],"demonstrate":[144],"that":[145],"achieves":[147],"ratio":[150],"up":[152],"200":[154],"times,":[155],"surpassing":[156],"performance":[158,167],"existing":[160],"frameworks":[163],"exhibiting":[165],"excellent":[166],"in":[168],"downstream":[169],"tasks":[170],"such":[171],"as":[172],"object":[173],"classification":[174],"detection.":[176]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
