{"id":"https://openalex.org/W4401577246","doi":"https://doi.org/10.3389/fcomp.2024.1420965","title":"Spatial attention guided cGAN for improved salient object detection","display_name":"Spatial attention guided cGAN for improved salient object detection","publication_year":2024,"publication_date":"2024-08-14","ids":{"openalex":"https://openalex.org/W4401577246","doi":"https://doi.org/10.3389/fcomp.2024.1420965"},"language":"en","primary_location":{"id":"doi:10.3389/fcomp.2024.1420965","is_oa":true,"landing_page_url":"https://doi.org/10.3389/fcomp.2024.1420965","pdf_url":"https://www.frontiersin.org/journals/computer-science/articles/10.3389/fcomp.2024.1420965/pdf","source":{"id":"https://openalex.org/S4210211086","display_name":"Frontiers in Computer Science","issn_l":"2624-9898","issn":["2624-9898"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.frontiersin.org/journals/computer-science/articles/10.3389/fcomp.2024.1420965/pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007552220","display_name":"Gayathri Dhara","orcid":"https://orcid.org/0000-0002-2182-8718"},"institutions":[{"id":"https://openalex.org/I4210131147","display_name":"SRM University","ror":"https://ror.org/037skf023","country_code":"IN","type":"education","lineage":["https://openalex.org/I145286018","https://openalex.org/I4210131147"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Gayathri Dhara","raw_affiliation_strings":["Department of Computer Science and Engineering (CSE), SRM University, Amaravathi, Andhra Pradesh, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering (CSE), SRM University, Amaravathi, Andhra Pradesh, India","institution_ids":["https://openalex.org/I4210131147"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100521148","display_name":"Ravi Kant Kumar","orcid":"https://orcid.org/0000-0003-0621-7692"},"institutions":[{"id":"https://openalex.org/I4210131147","display_name":"SRM University","ror":"https://ror.org/037skf023","country_code":"IN","type":"education","lineage":["https://openalex.org/I145286018","https://openalex.org/I4210131147"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Ravi Kant Kumar","raw_affiliation_strings":["Department of Computer Science and Engineering (CSE), SRM University, Amaravathi, Andhra Pradesh, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering (CSE), SRM University, Amaravathi, Andhra Pradesh, India","institution_ids":["https://openalex.org/I4210131147"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100521148"],"corresponding_institution_ids":["https://openalex.org/I4210131147"],"apc_list":{"value":1150,"currency":"USD","value_usd":1150},"apc_paid":{"value":1150,"currency":"USD","value_usd":1150},"fwci":2.0291,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.8801041,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"6","issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11094","display_name":"Face Recognition and Perception","score":0.9611999988555908,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.8287314176559448},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7443715333938599},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.7252299785614014},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.676409125328064},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6378412246704102},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5655754804611206},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.548066258430481},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4845534861087799},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4752488136291504},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4690910577774048},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.45507800579071045},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4400354325771332}],"concepts":[{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.8287314176559448},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7443715333938599},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.7252299785614014},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.676409125328064},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6378412246704102},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5655754804611206},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.548066258430481},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4845534861087799},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4752488136291504},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4690910577774048},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.45507800579071045},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4400354325771332},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3389/fcomp.2024.1420965","is_oa":true,"landing_page_url":"https://doi.org/10.3389/fcomp.2024.1420965","pdf_url":"https://www.frontiersin.org/journals/computer-science/articles/10.3389/fcomp.2024.1420965/pdf","source":{"id":"https://openalex.org/S4210211086","display_name":"Frontiers in Computer Science","issn_l":"2624-9898","issn":["2624-9898"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Computer Science","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:6e45de33ef1541d78ab66ba2b0e180a9","is_oa":true,"landing_page_url":"https://doaj.org/article/6e45de33ef1541d78ab66ba2b0e180a9","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Frontiers in Computer Science, Vol 6 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3389/fcomp.2024.1420965","is_oa":true,"landing_page_url":"https://doi.org/10.3389/fcomp.2024.1420965","pdf_url":"https://www.frontiersin.org/journals/computer-science/articles/10.3389/fcomp.2024.1420965/pdf","source":{"id":"https://openalex.org/S4210211086","display_name":"Frontiers in Computer Science","issn_l":"2624-9898","issn":["2624-9898"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6399999856948853,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320317486","display_name":"SRM Institute of Science and Technology","ror":"https://ror.org/037skf023"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4401577246.pdf"},"referenced_works_count":73,"referenced_works":["https://openalex.org/W21025885","https://openalex.org/W1497599070","https://openalex.org/W1686810756","https://openalex.org/W1923697677","https://openalex.org/W1982075130","https://openalex.org/W1996326832","https://openalex.org/W2014467472","https://openalex.org/W2055289854","https://openalex.org/W2149095485","https://openalex.org/W2161236525","https://openalex.org/W2164084182","https://openalex.org/W2294182682","https://openalex.org/W2412782625","https://openalex.org/W2508330216","https://openalex.org/W2559597482","https://openalex.org/W2559655401","https://openalex.org/W2604272474","https://openalex.org/W2630837129","https://openalex.org/W2740667773","https://openalex.org/W2887745158","https://openalex.org/W2894469712","https://openalex.org/W2896335074","https://openalex.org/W2908622466","https://openalex.org/W2940700666","https://openalex.org/W2963529609","https://openalex.org/W2963868681","https://openalex.org/W2963881378","https://openalex.org/W2981000764","https://openalex.org/W2997110625","https://openalex.org/W2997316506","https://openalex.org/W2998449272","https://openalex.org/W3010136160","https://openalex.org/W3025800305","https://openalex.org/W3083291461","https://openalex.org/W3122006940","https://openalex.org/W3163079050","https://openalex.org/W3177087374","https://openalex.org/W3185489052","https://openalex.org/W4236965008","https://openalex.org/W4239147634","https://openalex.org/W4295521014","https://openalex.org/W4301409532","https://openalex.org/W4320013936","https://openalex.org/W4371766314","https://openalex.org/W6620707391","https://openalex.org/W6623430341","https://openalex.org/W6639824700","https://openalex.org/W6660344663","https://openalex.org/W6662642246","https://openalex.org/W6672295943","https://openalex.org/W6675026286","https://openalex.org/W6678459986","https://openalex.org/W6683766560","https://openalex.org/W6684191040","https://openalex.org/W6684406275","https://openalex.org/W6687483927","https://openalex.org/W6729966448","https://openalex.org/W6730342312","https://openalex.org/W6735913928","https://openalex.org/W6737324727","https://openalex.org/W6741832134","https://openalex.org/W6742002635","https://openalex.org/W6742879749","https://openalex.org/W6748481559","https://openalex.org/W6749312877","https://openalex.org/W6750983645","https://openalex.org/W6765841262","https://openalex.org/W6766759761","https://openalex.org/W6770614152","https://openalex.org/W6772117364","https://openalex.org/W6779767817","https://openalex.org/W6795857834","https://openalex.org/W6856125862"],"related_works":["https://openalex.org/W4293202849","https://openalex.org/W1980965563","https://openalex.org/W1489300767","https://openalex.org/W2387995142","https://openalex.org/W4380714744","https://openalex.org/W4319453655","https://openalex.org/W2089959425","https://openalex.org/W2057775761","https://openalex.org/W2964074194","https://openalex.org/W2366944513"],"abstract_inverted_index":{"Recent":[0],"research":[1],"shows":[2],"that":[3,21],"Conditional":[4],"Generative":[5],"Adversarial":[6],"Networks":[7],"(cGANs)":[8],"are":[9,64,224,301],"effective":[10],"for":[11,37,59,82,107,122,229,274,351],"Salient":[12],"Object":[13],"Detection":[14],"(SOD),":[15],"a":[16,110],"challenging":[17,60,327],"computer":[18],"vision":[19,26],"task":[20,39],"mimics":[22],"the":[23,80,119,125,134,142,148,152,157,171,189,195,204,227,236,247,252,259,309,315,320,326],"way":[24],"human":[25],"focuses":[27],"on":[28,291,314,319,325],"important":[29],"parts":[30],"of":[31,87,95,133,150,183],"an":[32,104],"image.":[33],"However,":[34],"implementing":[35],"cGANs":[36,88],"this":[38],"has":[40],"presented":[41],"several":[42],"complexities,":[43],"including":[44],"instability":[45],"during":[46],"training":[47,144,158,246],"with":[48,69,175],"skip":[49],"connections,":[50],"weak":[51],"generators,":[52],"and":[53,85,93,129,155,179,191,199,231,249,264,281,297,323,328],"difficulty":[54],"in":[55,188,257,343],"capturing":[56],"context":[57],"information":[58],"images.":[61],"These":[62],"challenges":[63],"particularly":[65],"evident":[66],"when":[67],"dealing":[68],"input":[70],"images":[71],"containing":[72],"small":[73],"salient":[74,96,135,153,260,275,344],"objects":[75,154],"against":[76],"complex":[77,329],"backgrounds,":[78],"underscoring":[79],"need":[81],"careful":[83],"design":[84],"tuning":[86],"to":[89,146,216,234,239,303,333],"ensure":[90],"accurate":[91,131],"segmentation":[92,132],"detection":[94],"objects.":[97,136],"To":[98],"address":[99],"these":[100,292],"issues,":[101],"we":[102],"propose":[103],"innovative":[105],"method":[106,114,307,339],"SOD":[108],"using":[109,268,287],"cGAN":[111,143],"framework.":[112],"Our":[113,283,306,337],"utilizes":[115],"encoder-decoder":[116],"framework":[117],"as":[118],"generator":[120,250],"component":[121],"cGAN,":[123],"enhancing":[124],"feature":[126,214],"extraction":[127],"process":[128,145],"facilitating":[130],"We":[137,262],"incorporate":[138],"Wasserstein-1":[139],"distance":[140],"within":[141],"improve":[147],"accuracy":[149],"finding":[151,258],"stabilize":[156],"process.":[159],"Additionally,":[160],"our":[161,266],"enhanced":[162],"model":[163,253,267],"efficiently":[164],"captures":[165],"intricate":[166],"saliency":[167,218,222,242],"cues":[168],"by":[169,209,226],"leveraging":[170],"spatial":[172],"attention":[173,206],"gate":[174],"global":[176,184,197],"average":[177,185],"pooling":[178,186],"regularization.":[180],"The":[181,220],"introduction":[182],"layers":[187],"encoder":[190],"decoder":[192],"paths":[193],"enhances":[194],"network's":[196],"perception":[198],"fine-grained":[200],"detail":[201],"capture,":[202],"while":[203],"channel":[205],"mechanism,":[207],"facilitated":[208],"dense":[210],"layers,":[211],"dynamically":[212],"modulates":[213],"maps":[215,223],"amplify":[217],"cues.":[219],"generated":[221],"evaluated":[225,286],"discriminator":[228,248],"authenticity":[230],"gives":[232],"feedback":[233],"enhance":[235],"generator's":[237],"ability":[238],"generate":[240],"high-resolution":[241],"maps.":[243],"By":[244],"iteratively":[245],"networks,":[251],"achieves":[254],"improved":[255],"results":[256],"object.":[261],"trained":[263],"validated":[265],"large-scale":[269],"benchmark":[270],"datasets":[271],"commonly":[272],"used":[273,302],"object":[276,345],"detection,":[277,346],"namely":[278],"DUTS,":[279],"ECSSD,":[280],"DUT-OMRON.":[282],"approach":[284],"was":[285],"standard":[288],"performance":[289],"metrics":[290,300],"datasets.":[293],"Precision,":[294],"recall,":[295],"MAE":[296,311],"F\u03b2":[298],"score":[299],"evaluate":[304],"performance.":[305],"achieved":[308],"lowest":[310],"values:":[312],"0.0292":[313],"ECSSD":[316],"dataset,":[317,322,331],"0.033":[318],"DUTS-TE":[321],"0.0439":[324],"DUT-OMRON":[330],"compared":[332],"other":[334],"state-of-the-art":[335],"methods.":[336],"proposed":[338],"demonstrates":[340],"significant":[341],"improvements":[342],"highlighting":[347],"its":[348],"potential":[349],"benefits":[350],"real-life":[352],"applications.":[353]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
