{"id":"https://openalex.org/W7130364403","doi":"https://doi.org/10.48550/arxiv.2602.15405","title":"Joint Enhancement and Classification using Coupled Diffusion Models of Signals and Logits","display_name":"Joint Enhancement and Classification using Coupled Diffusion Models of Signals and Logits","publication_year":2026,"publication_date":"2026-02-17","ids":{"openalex":"https://openalex.org/W7130364403","doi":"https://doi.org/10.48550/arxiv.2602.15405"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.15405","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.15405","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.15405","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126332103","display_name":"Gilad Nurko","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Nurko, Gilad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092998293","display_name":"Roi Benita","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Benita, Roi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035675810","display_name":"Yehoshua Dissen","orcid":"https://orcid.org/0000-0002-9380-8169"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dissen, Yehoshua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126332424","display_name":"Tomohiro Nakatani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nakatani, Tomohiro","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123640883","display_name":"Marc Delcroix","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Delcroix, Marc","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009309584","display_name":"Shoko Araki","orcid":"https://orcid.org/0000-0003-4363-4305"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Araki, Shoko","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5043768519","display_name":"Yossi Keshet","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Keshet, Joseph","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5126332103"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.25690001249313354,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.25690001249313354,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.1242000013589859,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.08550000190734863,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.5888000130653381},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5271000266075134},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.5171999931335449},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.5009999871253967},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.446399986743927},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.44440001249313354},{"id":"https://openalex.org/keywords/noise-measurement","display_name":"Noise measurement","score":0.3546000123023987}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6478999853134155},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5924000144004822},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.5888000130653381},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5271000266075134},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.5171999931335449},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.5009999871253967},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.446399986743927},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.44440001249313354},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.3546000123023987},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3546000123023987},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.35199999809265137},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.34769999980926514},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.31360000371932983},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.30959999561309814},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C18653775","wikidata":"https://www.wikidata.org/wiki/Q1333358","display_name":"Joint probability distribution","level":2,"score":0.28369998931884766},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2802000045776367},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.15405","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.15405","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.15405","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.15405","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7544705271720886,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Robust":[0],"classification":[1,19,139,158],"in":[2,9,41,157],"noisy":[3],"environments":[4],"remains":[5],"a":[6,31,52],"fundamental":[7],"challenge":[8],"machine":[10],"learning.":[11],"Standard":[12],"approaches":[13],"typically":[14],"treat":[15],"signal":[16,27,67,94,107],"enhancement":[17,135,150],"and":[18,28,68,128,140,154],"as":[20],"separate,":[21],"sequential":[22,149],"stages:":[23],"first":[24],"enhancing":[25,93],"the":[26,38,42,65,69,72,83,92,96,101,106,113,122,126,129],"then":[29],"applying":[30],"classifier.":[32,84],"This":[33,85],"approach":[34],"fails":[35],"to":[36,119],"leverage":[37],"semantic":[39],"information":[40],"classifier's":[43,73],"output":[44,74],"during":[45],"denoising.":[46],"In":[47],"this":[48],"work,":[49],"we":[50],"propose":[51],"general,":[53],"domain-agnostic":[54],"framework":[55,146],"that":[56],"integrates":[57],"two":[58],"interacting":[59],"diffusion":[60],"models:":[61],"one":[62],"operating":[63],"on":[64,71],"input":[66,127],"other":[70],"logits,":[75],"without":[76],"requiring":[77],"any":[78],"retraining":[79],"or":[80],"fine-tuning":[81],"of":[82,112,125],"coupled":[86],"formulation":[87],"enables":[88],"mutual":[89],"guidance,":[90],"where":[91],"refines":[95],"class":[97,103],"estimation":[98],"and,":[99],"conversely,":[100],"evolving":[102],"logits":[104],"guide":[105],"reconstruction":[108],"towards":[109],"discriminative":[110],"regions":[111],"manifold.":[114],"We":[115,131],"introduce":[116],"three":[117],"strategies":[118],"effectively":[120],"model":[121],"joint":[123,134],"distribution":[124],"logit.":[130],"evaluated":[132],"our":[133],"method":[136],"for":[137],"image":[138],"automatic":[141],"speech":[142],"recognition.":[143],"The":[144],"proposed":[145],"surpasses":[147],"traditional":[148],"baselines,":[151],"delivering":[152],"robust":[153],"flexible":[155],"improvements":[156],"accuracy":[159],"under":[160],"diverse":[161],"noise":[162],"conditions.":[163]},"counts_by_year":[],"updated_date":"2026-02-19T06:31:58.851227","created_date":"2026-02-19T00:00:00"}
