{"id":"https://openalex.org/W2402640619","doi":"https://doi.org/10.1109/icassp.2016.7472018","title":"Automatic image region annotation through segmentation based visual semantic analysis and discriminative classification","display_name":"Automatic image region annotation through segmentation based visual semantic analysis and discriminative classification","publication_year":2016,"publication_date":"2016-03-01","ids":{"openalex":"https://openalex.org/W2402640619","doi":"https://doi.org/10.1109/icassp.2016.7472018","mag":"2402640619"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2016.7472018","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7472018","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073219155","display_name":"Jing Zhang","orcid":"https://orcid.org/0000-0002-0171-0683"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jing Zhang","raw_affiliation_strings":["Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051966001","display_name":"Yongwei Gao","orcid":"https://orcid.org/0000-0001-7026-9273"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongwei Gao","raw_affiliation_strings":["Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085209535","display_name":"Shengwei Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengwei Feng","raw_affiliation_strings":["Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046428374","display_name":"Yubo Yuan","orcid":"https://orcid.org/0000-0002-7577-3257"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yubo Yuan","raw_affiliation_strings":["Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066868860","display_name":"Chin\u2010Hui Lee","orcid":"https://orcid.org/0000-0002-1892-2551"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chin-Hui Lee","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5073219155"],"corresponding_institution_ids":["https://openalex.org/I143593769"],"apc_list":null,"apc_paid":null,"fwci":1.503,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.87950392,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1956","last_page":"1960"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8086395859718323},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7943545579910278},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7801331281661987},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6444926261901855},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.61257404088974},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.576560378074646},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5693520903587341},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5477650761604309},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5286258459091187},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.49607548117637634},{"id":"https://openalex.org/keywords/automatic-image-annotation","display_name":"Automatic image annotation","score":0.441714882850647},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4222773313522339},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4038398265838623},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.38894030451774597}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8086395859718323},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7943545579910278},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7801331281661987},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6444926261901855},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.61257404088974},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.576560378074646},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5693520903587341},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5477650761604309},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5286258459091187},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.49607548117637634},{"id":"https://openalex.org/C199579030","wikidata":"https://www.wikidata.org/wiki/Q2851778","display_name":"Automatic image annotation","level":4,"score":0.441714882850647},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4222773313522339},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4038398265838623},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.38894030451774597},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2016.7472018","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7472018","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7699999809265137,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W270047479","https://openalex.org/W1666447063","https://openalex.org/W1972969203","https://openalex.org/W1978784480","https://openalex.org/W2003246537","https://openalex.org/W2025684201","https://openalex.org/W2044028121","https://openalex.org/W2044101907","https://openalex.org/W2048782579","https://openalex.org/W2054103873","https://openalex.org/W2066806222","https://openalex.org/W2075880488","https://openalex.org/W2095844239","https://openalex.org/W2106582716","https://openalex.org/W2107034620","https://openalex.org/W2115517344","https://openalex.org/W2120929742","https://openalex.org/W2122715077","https://openalex.org/W2127411609","https://openalex.org/W2127970545","https://openalex.org/W2128197086","https://openalex.org/W2131846894","https://openalex.org/W2155404595","https://openalex.org/W2155985447","https://openalex.org/W2165828254","https://openalex.org/W2167295232","https://openalex.org/W2172231696","https://openalex.org/W2768204113","https://openalex.org/W4301518236","https://openalex.org/W6676013328","https://openalex.org/W6677204712","https://openalex.org/W6678852649","https://openalex.org/W6684451480","https://openalex.org/W6945237511"],"related_works":["https://openalex.org/W3177930984","https://openalex.org/W2052697133","https://openalex.org/W2119028572","https://openalex.org/W2376984068","https://openalex.org/W2152482390","https://openalex.org/W2365617273","https://openalex.org/W2076896210","https://openalex.org/W2093596879","https://openalex.org/W2506386910","https://openalex.org/W2117928543"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,21,29,46,51,59,63,77,82,110],"new":[3],"framework":[4],"for":[5],"automatic":[6],"image":[7,99],"annotation":[8,129],"(AIA)":[9],"of":[10,58,65,112],"regions":[11,36,100,105],"through":[12],"segmentation":[13],"based":[14,49],"semantic":[15],"analysis":[16],"and":[17,106],"discriminative":[18],"classification.":[19],"Given":[20],"test":[22],"image,":[23],"it":[24],"is":[25,69,86],"first":[26],"segmented":[27],"by":[28,39,81],"proposed":[30,121],"texture-enhanced":[31],"JSEG":[32],"algorithm.":[33],"Then":[34],"these":[35],"are":[37,95],"represented":[38],"an":[40],"extended":[41],"bag-of-words":[42],"model":[43],"in":[44],"which":[45],"feature":[47],"vector,":[48],"on":[50,109],"visual":[52,60,67],"lexicon":[53],"with":[54,101],"its":[55],"vocabulary":[56],"consisting":[57],"word":[61],"or":[62],"co-occurrence":[64],"multiple":[66,102],"words,":[68],"constructed":[70],"to":[71,88,123],"represent":[72],"the":[73,90,113],"region":[74,91,124],"content.":[75],"Finally":[76],"concept":[78],"classifier":[79],"learned":[80],"maximal":[83],"figure-of-merit":[84],"algorithm":[85],"used":[87],"predict":[89],"labels.":[92],"These":[93],"models":[94],"discriminatively":[96],"trained":[97],"from":[98],"associations":[103],"between":[104],"concepts.":[107],"Experiments":[108],"subset":[111],"Corel":[114],"5K":[115],"data":[116],"set":[117],"illustrate":[118],"that":[119],"our":[120],"approach":[122],"AIA":[125],"achieves":[126],"more":[127],"accurate":[128],"results":[130],"than":[131],"some":[132],"sate-of-the-art":[133],"algorithms.":[134]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
