{"id":"https://openalex.org/W4396753518","doi":"https://doi.org/10.1109/tcsvt.2024.3398145","title":"Detail-Preserving and Diverse Image Translation for Adverse Visual Object Detection","display_name":"Detail-Preserving and Diverse Image Translation for Adverse Visual Object Detection","publication_year":2024,"publication_date":"2024-05-08","ids":{"openalex":"https://openalex.org/W4396753518","doi":"https://doi.org/10.1109/tcsvt.2024.3398145"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3398145","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tcsvt.2024.3398145","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009670425","display_name":"Guolong Sun","orcid":"https://orcid.org/0009-0000-4517-8038"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guolong Sun","raw_affiliation_strings":["School of Artificial Intelligence, OPtics and ElectroNics (iOPEN), Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, OPtics and ElectroNics (iOPEN), Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022524675","display_name":"Zhitong Xiong","orcid":"https://orcid.org/0000-0002-3953-585X"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Zhitong Xiong","raw_affiliation_strings":["Chair of Data Science in Earth Observation, Technical University of Munich (TUM), Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Chair of Data Science in Earth Observation, Technical University of Munich (TUM), Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100334740","display_name":"Yuan Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Yuan","raw_affiliation_strings":["School of Artificial Intelligence, OPtics and ElectroNics (iOPEN), Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, OPtics and ElectroNics (iOPEN), Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5009670425"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0545648,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":"10","first_page":"9139","last_page":"9152"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.979200005531311,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7023237347602844},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6591832041740417},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.6533176302909851},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6134025454521179},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5942461490631104},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.43714994192123413},{"id":"https://openalex.org/keywords/image-translation","display_name":"Image translation","score":0.4319276809692383},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.43165087699890137},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4148321747779846},{"id":"https://openalex.org/keywords/object-class-detection","display_name":"Object-class detection","score":0.41190606355667114},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3006928563117981},{"id":"https://openalex.org/keywords/face-detection","display_name":"Face detection","score":0.09627020359039307}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7023237347602844},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6591832041740417},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.6533176302909851},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6134025454521179},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5942461490631104},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.43714994192123413},{"id":"https://openalex.org/C2779757391","wikidata":"https://www.wikidata.org/wiki/Q6002292","display_name":"Image translation","level":3,"score":0.4319276809692383},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.43165087699890137},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4148321747779846},{"id":"https://openalex.org/C71681937","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object-class detection","level":5,"score":0.41190606355667114},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3006928563117981},{"id":"https://openalex.org/C4641261","wikidata":"https://www.wikidata.org/wiki/Q11681085","display_name":"Face detection","level":4,"score":0.09627020359039307},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C31510193","wikidata":"https://www.wikidata.org/wiki/Q1192553","display_name":"Facial recognition system","level":3,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3398145","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tcsvt.2024.3398145","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1195665351","display_name":null,"funder_award_id":"2020YFB2103900","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2210533046","display_name":null,"funder_award_id":"61825603","funder_id":"https://openalex.org/F4320336125","funder_display_name":"National Science Fund for Distinguished Young Scholars"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320336125","display_name":"National Science Fund for Distinguished Young Scholars","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":80,"referenced_works":["https://openalex.org/W1640745651","https://openalex.org/W1901129140","https://openalex.org/W2054814429","https://openalex.org/W2116973876","https://openalex.org/W2150461190","https://openalex.org/W2187089797","https://openalex.org/W2254039850","https://openalex.org/W2538864697","https://openalex.org/W2545656684","https://openalex.org/W2566376500","https://openalex.org/W2593414223","https://openalex.org/W2735974062","https://openalex.org/W2798799804","https://openalex.org/W2887817889","https://openalex.org/W2894931878","https://openalex.org/W2912512021","https://openalex.org/W2949187370","https://openalex.org/W2952056941","https://openalex.org/W2962793481","https://openalex.org/W2963516811","https://openalex.org/W2963920537","https://openalex.org/W2964115968","https://openalex.org/W2968634921","https://openalex.org/W2982770724","https://openalex.org/W2989045104","https://openalex.org/W2989236540","https://openalex.org/W2996290406","https://openalex.org/W3034305572","https://openalex.org/W3034779842","https://openalex.org/W3035175896","https://openalex.org/W3035564946","https://openalex.org/W3035731588","https://openalex.org/W3082125592","https://openalex.org/W3107259129","https://openalex.org/W3107989310","https://openalex.org/W3108910236","https://openalex.org/W3115000224","https://openalex.org/W3118035304","https://openalex.org/W3124817676","https://openalex.org/W3125028070","https://openalex.org/W3129242782","https://openalex.org/W3166409449","https://openalex.org/W3174908463","https://openalex.org/W3176493691","https://openalex.org/W3179888767","https://openalex.org/W3181722447","https://openalex.org/W3194643899","https://openalex.org/W3195892675","https://openalex.org/W3207919963","https://openalex.org/W3208798508","https://openalex.org/W4205932092","https://openalex.org/W4220784517","https://openalex.org/W4226178953","https://openalex.org/W4226367752","https://openalex.org/W4304141717","https://openalex.org/W4312052506","https://openalex.org/W4312249431","https://openalex.org/W4312287126","https://openalex.org/W4312461295","https://openalex.org/W4312713178","https://openalex.org/W4312902661","https://openalex.org/W4312993742","https://openalex.org/W4313160378","https://openalex.org/W4322707256","https://openalex.org/W4360584634","https://openalex.org/W4367301647","https://openalex.org/W4383109290","https://openalex.org/W4385326867","https://openalex.org/W4385420965","https://openalex.org/W4386066209","https://openalex.org/W4386212341","https://openalex.org/W4386702642","https://openalex.org/W4389371446","https://openalex.org/W6620707391","https://openalex.org/W6640174519","https://openalex.org/W6729110096","https://openalex.org/W6733814495","https://openalex.org/W6750759024","https://openalex.org/W6770444568","https://openalex.org/W6811253114"],"related_works":["https://openalex.org/W2901758161","https://openalex.org/W4205668735","https://openalex.org/W4288069866","https://openalex.org/W4389232935","https://openalex.org/W3155045749","https://openalex.org/W3204852000","https://openalex.org/W3126664501","https://openalex.org/W3209429418","https://openalex.org/W4297540035","https://openalex.org/W4312834249"],"abstract_inverted_index":{"The":[0,94],"effectiveness":[1],"of":[2,97,126,139,160,182,188,200],"object":[3,248],"detection":[4,190,249],"is":[5,15,170],"significantly":[6],"hampered":[7],"in":[8,49,66,130,203,250],"challenging":[9,128,215],"nighttime":[10],"or":[11],"rainy":[12,60],"scenarios.":[13],"This":[14,120],"due":[16],"to":[17,149,234],"the":[18,67,123,137,140,158,179,186,189,197,205,219],"severe":[19],"domain":[20,42,86,239],"shifts":[21,87],"between":[22,178],"daytime":[23],"and":[24,91,116,185,228,237],"adverse-visual":[25],"images.":[26,93],"Previous":[27],"methods":[28,35,222],"have":[29],"demonstrated":[30],"that":[31,84],"using":[32],"image-to-image":[33],"translation":[34],"for":[36,247],"data":[37],"augmentation":[38],"can":[39,230],"effectively":[40],"address":[41],"shifts,":[43],"but":[44,165],"they":[45],"may":[46],"still":[47],"fail":[48],"preserving":[50],"image":[51],"objects":[52],"when":[53],"faced":[54],"with":[55],"extreme":[56],"adverse":[57,251],"images":[58,129,184],"like":[59],"nights.":[61],"In":[62],"addition,":[63],"achieving":[64],"diversity":[65,159,181,202],"generated":[68],"results":[69],"remains":[70],"challenging.":[71],"To":[72,135,156],"this":[73,98],"end,":[74],"we":[75,142],"propose":[76,105],"a":[77,106,117,131,163,175,193,244],"Progressive":[78],"Adverse":[79],"Image":[80],"Translation":[81],"(PAIT)":[82],"framework":[83,121,209],"tackles":[85],"by":[88,223],"generating":[89],"diverse":[90],"detail-preserving":[92],"main":[95],"contributions":[96],"paper":[99],"are":[100],"as":[101],"follows.":[102],"1)":[103],"We":[104,173],"novel":[107],"PAIT":[108],"framework,":[109],"which":[110],"incorporates":[111],"an":[112,145],"iterative":[113,146],"mapping":[114,147],"module":[115,148],"slicing":[118],"layer.":[119],"enables":[122],"progressive":[124],"generation":[125],"increasingly":[127],"fine-to-coarse":[132],"manner.":[133],"2)":[134],"preserve":[136],"details":[138],"images,":[141,162],"innovatively":[143],"introduce":[144],"generate":[150],"smooth":[151],"style":[152,180,201],"transform":[153],"curves.":[154],"3)":[155],"enhance":[157],"synthesized":[161],"simple":[164],"efficient":[166],"end-to-end":[167],"optimization":[168],"method":[169],"proposed.":[171],"4)":[172],"found":[174],"strong":[176],"correlation":[177],"augmented":[183],"performance":[187,212],"model":[191],"through":[192],"quantitative":[194],"analysis,":[195],"highlighting":[196],"crucial":[198],"role":[199],"enhancing":[204],"model\u2019s":[206],"generalizability.":[207],"Our":[208,254],"achieves":[210],"state-of-the-art":[211,221],"on":[213],"multiple":[214],"visual":[216,252],"datasets,":[217],"surpassing":[218],"current":[220],"27%(+8.0AP).":[224],"Moreover,":[225],"our":[226],"approach":[227],"modules":[229],"be":[231,257],"easily":[232],"extended":[233],"different":[235],"detectors":[236],"other":[238],"adaptation":[240],"methods,":[241],"making":[242],"it":[243],"versatile":[245],"solution":[246],"environments.":[253],"code":[255],"will":[256],"available":[258],"at":[259],"<uri":[260],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[261],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/ssunguotu/Diverse-Aug</uri>.":[262]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
