{"id":"https://openalex.org/W4394708943","doi":"https://doi.org/10.48550/arxiv.2404.05980","title":"Tackling Structural Hallucination in Image Translation with Local Diffusion","display_name":"Tackling Structural Hallucination in Image Translation with Local Diffusion","publication_year":2024,"publication_date":"2024-04-09","ids":{"openalex":"https://openalex.org/W4394708943","doi":"https://doi.org/10.48550/arxiv.2404.05980"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2404.05980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.05980","pdf_url":"https://arxiv.org/pdf/2404.05980","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.05980","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023512746","display_name":"Seunghoi Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kim, Seunghoi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061700100","display_name":"Chen Jin","orcid":"https://orcid.org/0000-0002-2179-6445"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Chen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058474860","display_name":"Tom Diethe","orcid":"https://orcid.org/0000-0002-0776-5407"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Diethe, Tom","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061466213","display_name":"Matteo Figini","orcid":"https://orcid.org/0000-0002-8238-2262"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Figini, Matteo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015372912","display_name":"Henry F. J. Tregidgo","orcid":"https://orcid.org/0000-0002-3509-8154"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tregidgo, Henry F. J.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002960442","display_name":"Asher Mullokandov","orcid":"https://orcid.org/0009-0007-8171-4353"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mullokandov, Asher","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067992725","display_name":"Philip Teare","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Teare, Philip","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5033449704","display_name":"Daniel C. Alexander","orcid":"https://orcid.org/0000-0003-2439-350X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alexander, Daniel C.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5023512746"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T13095","display_name":"Plant-based Medicinal Research","score":0.9811999797821045,"subfield":{"id":"https://openalex.org/subfields/3004","display_name":"Pharmacology"},"field":{"id":"https://openalex.org/fields/30","display_name":"Pharmacology, Toxicology and Pharmaceutics"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.7407180070877075},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5272908210754395},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.5205549001693726},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.35679590702056885},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3557414710521698},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3105126619338989},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10882210731506348},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.07509505748748779}],"concepts":[{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.7407180070877075},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5272908210754395},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.5205549001693726},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.35679590702056885},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3557414710521698},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3105126619338989},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10882210731506348},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.07509505748748779},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2404.05980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.05980","pdf_url":"https://arxiv.org/pdf/2404.05980","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10201190","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10201190/","pdf_url":"https://discovery.ucl.ac.uk/10201190/1/eccv.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"In: Leonardis, Ale\u0161 and Ricci, Elisa and Roth, Stefan and Russakovsky, Olga and Sattler, Torsten and Varol, G\u00fcl, (eds.) Computer Vision \u2013 ECCV 2024: 18th European Conference, Milan, Italy, September 29\u2013October 4, 2024, Proceedings, Part LXXXI.  (pp. pp. 87-103).  Springer: Cham, Switzerland. (2024)","raw_type":"Proceedings paper"},{"id":"doi:10.48550/arxiv.2404.05980","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2404.05980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.05980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.05980","pdf_url":"https://arxiv.org/pdf/2404.05980","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2931662336","https://openalex.org/W2077865380","https://openalex.org/W2765597752","https://openalex.org/W2936127876","https://openalex.org/W4213477128","https://openalex.org/W4287300272","https://openalex.org/W3155045749","https://openalex.org/W3134797699"],"abstract_inverted_index":{"Recent":[0],"developments":[1],"in":[2,22,40,58,125],"diffusion":[3,67,141],"models":[4,115],"have":[5],"advanced":[6],"conditioned":[7],"image":[8,54,131],"generation,":[9],"yet":[10],"they":[11],"struggle":[12],"with":[13,72,138],"reconstructing":[14],"out-of-distribution":[15],"(OOD)":[16],"images,":[17,24],"such":[18,33],"as":[19],"unseen":[20],"tumors":[21],"medical":[23,128],"causing":[25],"\"image":[26],"hallucination\"":[27],"and":[28,51,93,97,117,123,129],"risking":[29],"misdiagnosis.":[30],"We":[31,44],"hypothesize":[32],"hallucinations":[34,57],"result":[35],"from":[36],"local":[37],"OOD":[38,49,80,95],"regions":[39],"the":[41,48,126],"conditional":[42],"images.":[43],"verify":[45],"that":[46,69],"partitioning":[47],"region":[50],"conducting":[52],"separate":[53],"generations":[55],"alleviates":[56],"several":[59],"applications.":[60],"From":[61],"this,":[62],"we":[63],"propose":[64],"a":[65,86,98],"training-free":[66],"framework":[68],"reduces":[70],"hallucination":[71,112],"multiple":[73],"Local":[74],"Diffusion":[75],"processes.":[76],"Our":[77,106],"approach":[78],"involves":[79],"estimation":[81],"followed":[82],"by":[83,121],"two":[84],"modules:":[85],"\"branching\"":[87],"module":[88,100],"generates":[89],"locally":[90],"both":[91],"within":[92],"outside":[94],"regions,":[96],"\"fusion\"":[99],"integrates":[101],"these":[102],"predictions":[103],"into":[104],"one.":[105],"evaluation":[107],"shows":[108],"our":[109],"method":[110],"mitigates":[111],"over":[113],"baseline":[114],"quantitatively":[116],"qualitatively,":[118],"reducing":[119],"misdiagnosis":[120],"40%":[122],"25%":[124],"real-world":[127],"natural":[130],"datasets,":[132],"respectively.":[133],"It":[134],"also":[135],"demonstrates":[136],"compatibility":[137],"various":[139],"pre-trained":[140],"models.":[142]},"counts_by_year":[],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
