{"id":"https://openalex.org/W4402916446","doi":"https://doi.org/10.1109/tcsvt.2024.3469286","title":"Generative Transformer for Accurate and Reliable Salient Object Detection","display_name":"Generative Transformer for Accurate and Reliable Salient Object Detection","publication_year":2024,"publication_date":"2024-09-27","ids":{"openalex":"https://openalex.org/W4402916446","doi":"https://doi.org/10.1109/tcsvt.2024.3469286"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3469286","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3469286","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yuxin Mao","orcid":"https://orcid.org/0000-0002-9239-091X"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuxin Mao","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-9239-091X","affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100630815","display_name":"Jing Zhang","orcid":"https://orcid.org/0000-0002-8516-0913"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Jing Zhang","raw_affiliation_strings":["School of Computing, Australian National University, Canberra, Australia"],"raw_orcid":"https://orcid.org/0000-0002-8516-0913","affiliations":[{"raw_affiliation_string":"School of Computing, Australian National University, Canberra, Australia","institution_ids":["https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050347496","display_name":"Zhexiong Wan","orcid":"https://orcid.org/0000-0002-4494-6178"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhexiong Wan","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-4494-6178","affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029944382","display_name":"Xinyu Tian","orcid":"https://orcid.org/0000-0003-1247-6076"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinyu Tian","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Aixuan Li","orcid":"https://orcid.org/0009-0000-6868-2384"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aixuan Li","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0009-0000-6868-2384","affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054874551","display_name":"Yunqiu Lv","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunqiu Lv","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036202579","display_name":"Yuchao Dai","orcid":"https://orcid.org/0000-0002-4432-7406"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuchao Dai","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-4432-7406","affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Shaanxi Key Laboratory of Information Acquisition and Processing, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.7806,"has_fulltext":false,"cited_by_count":31,"citation_normalized_percentile":{"value":0.97814966,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"35","issue":"2","first_page":"1041","last_page":"1054"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.9496999979019165,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6437410116195679},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5512102246284485},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5471476912498474},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.49283862113952637},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.44794395565986633},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4368540644645691},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4329172968864441},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13111558556556702}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6437410116195679},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5512102246284485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5471476912498474},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.49283862113952637},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.44794395565986633},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4368540644645691},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4329172968864441},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13111558556556702},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcsvt.2024.3469286","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3469286","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},{"id":"pmh:oai:openresearch-repository.anu.edu.au:1885/733751894","is_oa":false,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=85205319292&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4306402539","display_name":"ANU Open Research (Australian National University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I118347636","host_organization_name":"Australian National University","host_organization_lineage":["https://openalex.org/I118347636"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"Journal article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","display_name":"Climate action","score":0.6200000047683716}],"awards":[{"id":"https://openalex.org/G3766433509","display_name":null,"funder_award_id":"62271410","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3858504019","display_name":null,"funder_award_id":"CX2024014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":99,"referenced_works":["https://openalex.org/W845365781","https://openalex.org/W1894057436","https://openalex.org/W1901129140","https://openalex.org/W2002781701","https://openalex.org/W2039313011","https://openalex.org/W2086791339","https://openalex.org/W2108598243","https://openalex.org/W2128272608","https://openalex.org/W2171378720","https://openalex.org/W2194775991","https://openalex.org/W2519766107","https://openalex.org/W2740667773","https://openalex.org/W2744613561","https://openalex.org/W2778764040","https://openalex.org/W2780708736","https://openalex.org/W2798791651","https://openalex.org/W2799213142","https://openalex.org/W2897541487","https://openalex.org/W2904487290","https://openalex.org/W2948510860","https://openalex.org/W2950116990","https://openalex.org/W2954040150","https://openalex.org/W2961348656","https://openalex.org/W2963112696","https://openalex.org/W2963225012","https://openalex.org/W2963299740","https://openalex.org/W2963342032","https://openalex.org/W2963529609","https://openalex.org/W2963685207","https://openalex.org/W2963868681","https://openalex.org/W2964352379","https://openalex.org/W2979410457","https://openalex.org/W2980901882","https://openalex.org/W2987701848","https://openalex.org/W2990984982","https://openalex.org/W2996884277","https://openalex.org/W2997316506","https://openalex.org/W2998449272","https://openalex.org/W3002301267","https://openalex.org/W3034185160","https://openalex.org/W3034453930","https://openalex.org/W3035290198","https://openalex.org/W3035422681","https://openalex.org/W3096609285","https://openalex.org/W3107944836","https://openalex.org/W3113755791","https://openalex.org/W3122006940","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3147597595","https://openalex.org/W3149623420","https://openalex.org/W3154314696","https://openalex.org/W3154503495","https://openalex.org/W3165924482","https://openalex.org/W3170841864","https://openalex.org/W3173382343","https://openalex.org/W3179443972","https://openalex.org/W3197617356","https://openalex.org/W3200793272","https://openalex.org/W3205387145","https://openalex.org/W3207493400","https://openalex.org/W4214520160","https://openalex.org/W4214561053","https://openalex.org/W4214680709","https://openalex.org/W4214759957","https://openalex.org/W4226056010","https://openalex.org/W4239147634","https://openalex.org/W4241071816","https://openalex.org/W4285176133","https://openalex.org/W4289535682","https://openalex.org/W4293093495","https://openalex.org/W4293846201","https://openalex.org/W4310467366","https://openalex.org/W4312265121","https://openalex.org/W4312287801","https://openalex.org/W4366966982","https://openalex.org/W4380303870","https://openalex.org/W4385245566","https://openalex.org/W4386076434","https://openalex.org/W4387757595","https://openalex.org/W4387968414","https://openalex.org/W4390872864","https://openalex.org/W6637162671","https://openalex.org/W6637373629","https://openalex.org/W6640425456","https://openalex.org/W6640963894","https://openalex.org/W6683825394","https://openalex.org/W6687045409","https://openalex.org/W6739651123","https://openalex.org/W6748692255","https://openalex.org/W6748758124","https://openalex.org/W6752558437","https://openalex.org/W6757817989","https://openalex.org/W6758151150","https://openalex.org/W6765694979","https://openalex.org/W6768279175","https://openalex.org/W6784094891","https://openalex.org/W6784275809","https://openalex.org/W6803674551"],"related_works":["https://openalex.org/W2329500892","https://openalex.org/W28991112","https://openalex.org/W2370726991","https://openalex.org/W2369710579","https://openalex.org/W4327728159","https://openalex.org/W4394266730","https://openalex.org/W1990856605","https://openalex.org/W2053783616","https://openalex.org/W2545348020","https://openalex.org/W2912751582"],"abstract_inverted_index":{"We":[0,138],"explore":[1],"the":[2,17,34,54,58,68,72,84,90,95,98,118,153],"impact":[3],"of":[4,67,74,83,97],"transformers":[5],"on":[6],"accurate":[7,159],"and":[8,23,160,168],"reliable":[9,161],"salient":[10,146,162],"object":[11,147,163],"detection.":[12,164],"For":[13],"accuracy,":[14],"we":[15,32,47],"integrate":[16],"transformer":[18,55,154],"with":[19],"a":[20,49],"deterministic":[21],"model":[22,52],"delineate":[24],"its":[25],"advantages":[26],"in":[27],"structural":[28],"modeling.":[29],"Regarding":[30],"reliability,":[31],"address":[33],"transformer\u2019s":[35],"tendency":[36],"to":[37,132,143,157],"produce":[38],"overly":[39],"confident,":[40],"incorrect":[41],"predictions.":[42],"To":[43],"gauge":[44],"reliability":[45],"implicitly,":[46],"introduce":[48],"latent":[50,69,99,119,135],"variable":[51,70,100,120,136],"within":[53,152],"framework,":[56],"termed":[57],"inferential":[59],"generative":[60],"adversarial":[61],"network":[62],"(iGAN).":[63],"The":[64,114,165],"stochastic":[65],"nature":[66],"facilitates":[71],"estimation":[73],"predictive":[75],"uncertainty,":[76],"which":[77,93],"serves":[78],"as":[79,101],"an":[80,133],"auxiliary":[81],"measure":[82],"model\u2019s":[85],"prediction":[86],"reliability.":[87],"Different":[88],"from":[89],"conventional":[91],"GAN,":[92],"defines":[94],"distribution":[96,105],"fixed":[102],"standard":[103],"normal":[104],"<inline-formula":[106],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[107,179],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[108],"<tex-math":[109],"notation=\"LaTeX\">$\\mathcal":[110],"{N}(0,\\mathbf":[111],"{I})$":[112],"</tex-math></inline-formula>.":[113],"proposed":[115,141],"iGAN":[116,142,151],"infers":[117],"by":[121],"gradient-based":[122],"Markov":[123],"Chain":[124],"Monte":[125],"Carlo":[126],"(MCMC),":[127],"namely":[128],"Langevin":[129],"dynamics,":[130],"leading":[131],"input-dependent":[134],"model.":[137],"apply":[139],"our":[140,175],"fully":[144],"supervised":[145],"detection,":[148],"explaining":[149],"that":[150],"framework":[155],"leads":[156],"both":[158],"source":[166],"code":[167],"experimental":[169],"results":[170],"are":[171],"publicly":[172],"available":[173],"via":[174],"project":[176],"page:":[177],"<uri":[178],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://npucvr.github.io/TransformerSOD</uri>.":[180]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":22},{"year":2024,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
