{"id":"https://openalex.org/W3012287122","doi":"https://doi.org/10.1109/iros45743.2020.9341574","title":"Tidying Deep Saliency Prediction Architectures","display_name":"Tidying Deep Saliency Prediction Architectures","publication_year":2020,"publication_date":"2020-10-24","ids":{"openalex":"https://openalex.org/W3012287122","doi":"https://doi.org/10.1109/iros45743.2020.9341574","mag":"3012287122"},"language":"en","primary_location":{"id":"doi:10.1109/iros45743.2020.9341574","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros45743.2020.9341574","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2003.04942","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108738702","display_name":"Navyasri Reddy","orcid":null},"institutions":[{"id":"https://openalex.org/I188963388","display_name":"International Institute of Information Technology","ror":"https://ror.org/02dernx73","country_code":"IN","type":"education","lineage":["https://openalex.org/I188963388"]},{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Navyasri Reddy","raw_affiliation_strings":["International Institute of Information Technology,CVIT, KCIS,Hyderabad,India","International Institute of Information Technology, Hyderabad;"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology,CVIT, KCIS,Hyderabad,India","institution_ids":["https://openalex.org/I188963388"]},{"raw_affiliation_string":"International Institute of Information Technology, Hyderabad;","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101608990","display_name":"Samyak Jain","orcid":null},"institutions":[{"id":"https://openalex.org/I188963388","display_name":"International Institute of Information Technology","ror":"https://ror.org/02dernx73","country_code":"IN","type":"education","lineage":["https://openalex.org/I188963388"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Samyak Jain","raw_affiliation_strings":["International Institute of Information Technology,CVIT, KCIS,Hyderabad,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology,CVIT, KCIS,Hyderabad,India","institution_ids":["https://openalex.org/I188963388"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019427210","display_name":"Pradeep Yarlagadda","orcid":null},"institutions":[{"id":"https://openalex.org/I188963388","display_name":"International Institute of Information Technology","ror":"https://ror.org/02dernx73","country_code":"IN","type":"education","lineage":["https://openalex.org/I188963388"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Pradeep Yarlagadda","raw_affiliation_strings":["International Institute of Information Technology,CVIT, KCIS,Hyderabad,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology,CVIT, KCIS,Hyderabad,India","institution_ids":["https://openalex.org/I188963388"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067298540","display_name":"Vineet Gandhi","orcid":"https://orcid.org/0000-0001-8861-7731"},"institutions":[{"id":"https://openalex.org/I188963388","display_name":"International Institute of Information Technology","ror":"https://ror.org/02dernx73","country_code":"IN","type":"education","lineage":["https://openalex.org/I188963388"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Vineet Gandhi","raw_affiliation_strings":["International Institute of Information Technology,CVIT, KCIS,Hyderabad,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology,CVIT, KCIS,Hyderabad,India","institution_ids":["https://openalex.org/I188963388"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3916,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.60504716,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.970300018787384,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.8585940599441528},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7853686809539795},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7143591642379761},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7055871486663818},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6038243770599365},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5486666560173035},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5361189246177673},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5359993577003479},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.47760793566703796},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.44571825861930847},{"id":"https://openalex.org/keywords/cognitive-architecture","display_name":"Cognitive architecture","score":0.44476282596588135},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4258020222187042},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4188958406448364},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.2506433129310608}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.8585940599441528},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7853686809539795},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7143591642379761},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7055871486663818},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6038243770599365},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5486666560173035},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5361189246177673},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5359993577003479},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.47760793566703796},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.44571825861930847},{"id":"https://openalex.org/C20854674","wikidata":"https://www.wikidata.org/wiki/Q4386060","display_name":"Cognitive architecture","level":3,"score":0.44476282596588135},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4258020222187042},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4188958406448364},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.2506433129310608},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/iros45743.2020.9341574","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros45743.2020.9341574","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2003.04942","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2003.04942","pdf_url":"https://arxiv.org/pdf/2003.04942","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"mag:3012287122","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2003.04942","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2003.04942","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2003.04942","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2003.04942","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2003.04942","pdf_url":"https://arxiv.org/pdf/2003.04942","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[{"score":0.5699999928474426,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3012287122.pdf","grobid_xml":"https://content.openalex.org/works/W3012287122.grobid-xml"},"referenced_works_count":53,"referenced_works":["https://openalex.org/W1497599070","https://openalex.org/W1510835000","https://openalex.org/W1579853615","https://openalex.org/W1686810756","https://openalex.org/W1894057436","https://openalex.org/W1901129140","https://openalex.org/W1934890906","https://openalex.org/W1946606198","https://openalex.org/W2084098959","https://openalex.org/W2103666701","https://openalex.org/W2128272608","https://openalex.org/W2136790002","https://openalex.org/W2138046011","https://openalex.org/W2156142145","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2212216676","https://openalex.org/W2520859141","https://openalex.org/W2528092473","https://openalex.org/W2557536990","https://openalex.org/W2558906385","https://openalex.org/W2738450183","https://openalex.org/W2792609362","https://openalex.org/W2883347677","https://openalex.org/W2884775172","https://openalex.org/W2905233731","https://openalex.org/W2950519432","https://openalex.org/W2963446712","https://openalex.org/W2963503775","https://openalex.org/W2963623071","https://openalex.org/W2963828885","https://openalex.org/W2964081807","https://openalex.org/W2964114039","https://openalex.org/W2965685044","https://openalex.org/W3005401190","https://openalex.org/W3022565501","https://openalex.org/W3101840568","https://openalex.org/W3105966669","https://openalex.org/W3122238731","https://openalex.org/W6634817459","https://openalex.org/W6637373629","https://openalex.org/W6639359414","https://openalex.org/W6639824700","https://openalex.org/W6640683721","https://openalex.org/W6675836893","https://openalex.org/W6684191040","https://openalex.org/W6726906885","https://openalex.org/W6750375828","https://openalex.org/W6753053721","https://openalex.org/W6766857745","https://openalex.org/W6777463027","https://openalex.org/W6786277579","https://openalex.org/W6788940246"],"related_works":["https://openalex.org/W3132652652","https://openalex.org/W2890484038","https://openalex.org/W1946606198","https://openalex.org/W3005401190","https://openalex.org/W2775320731","https://openalex.org/W3095702468","https://openalex.org/W2914856806","https://openalex.org/W1532718000","https://openalex.org/W2982166103","https://openalex.org/W3127043518","https://openalex.org/W3035856201","https://openalex.org/W2944209449","https://openalex.org/W3095982069","https://openalex.org/W2981335848","https://openalex.org/W2962919941","https://openalex.org/W2996699350","https://openalex.org/W2902904290","https://openalex.org/W2891778567","https://openalex.org/W3135463655","https://openalex.org/W2744014255"],"abstract_inverted_index":{"Learning":[0],"computational":[1],"models":[2,52,92,179,194],"for":[3,188],"visual":[4,17],"attention":[5],"(saliency":[6],"estimation)":[7],"is":[8,134,153,166],"an":[9,135],"effort":[10],"to":[11,15,49,168,172],"inch":[12],"machines/robots":[13],"closer":[14],"human":[16],"cognitive":[18],"abilities.":[19],"Data-driven":[20],"efforts":[21],"have":[22],"dominated":[23],"the":[24,27,38,60,86,90,126,145,173],"landscape":[25],"since":[26],"introduction":[28],"of":[29,71,89,125,161],"deep":[30,35],"neural":[31],"network":[32],"architectures.":[33],"In":[34,63],"learning":[36],"research,":[37],"choices":[39],"in":[40,57],"architecture":[41,138],"design":[42],"are":[43,117,195],"often":[44],"empirical":[45],"and":[46,81,97,100,114,122,139,165,192],"frequently":[47],"lead":[48],"more":[50,120,170],"complex":[51],"than":[53],"necessary.":[54],"The":[55,176],"complexity,":[56],"turn,":[58],"hinders":[59],"application":[61],"requirements.":[62],"this":[64],"paper,":[65],"we":[66,106],"identify":[67],"four":[68,95],"key":[69],"components":[70,96],"saliency":[72,131,150,178],"models,":[73],"i.e.,":[74],"input":[75],"features,":[76],"multi-level":[77],"integration,":[78],"readout":[79],"architecture,":[80],"loss":[82],"functions.":[83],"We":[84],"review":[85],"existing":[87],"state":[88,124],"art":[91,127],"on":[93,129,144],"these":[94],"propose":[98,107],"novel":[99,109],"simpler":[101],"alternatives.":[102],"As":[103],"a":[104,154,162],"result,":[105],"two":[108],"end-to-end":[110],"architectures":[111],"called":[112],"SimpleNet":[113,133],"MDNSal,":[115],"which":[116],"neater,":[118],"minimal,":[119],"interpretable":[121],"achieve":[123],"performance":[128,142],"public":[130],"benchmarks.":[132],"optimized":[136],"encoder-decoder":[137],"brings":[140],"notable":[141],"gains":[143],"SALICON":[146],"dataset":[147],"(the":[148],"largest":[149],"benchmark).":[151],"MDNSal":[152],"parametric":[155],"model":[156],"that":[157],"directly":[158],"predicts":[159],"parameters":[160],"GMM":[163],"distribution":[164],"aimed":[167],"bring":[169],"interpretability":[171],"prediction":[174],"maps.":[175],"proposed":[177],"can":[180],"be":[181],"inferred":[182],"at":[183,197],"25fps,":[184],"making":[185],"them":[186],"suitable":[187],"real-time":[189],"applications.":[190],"Code":[191],"pre-trained":[193],"available":[196],"https://github.com/samyak0210/saliency.":[198]},"counts_by_year":[{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
