{"id":"https://openalex.org/W2973725754","doi":"https://doi.org/10.1109/tpami.2020.3024207","title":"Grid Anchor Based Image Cropping: A New Benchmark and An Efficient Model","display_name":"Grid Anchor Based Image Cropping: A New Benchmark and An Efficient Model","publication_year":2020,"publication_date":"2020-09-15","ids":{"openalex":"https://openalex.org/W2973725754","doi":"https://doi.org/10.1109/tpami.2020.3024207","mag":"2973725754","pmid":"https://pubmed.ncbi.nlm.nih.gov/32931429"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2020.3024207","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2020.3024207","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Hui Zeng","orcid":"https://orcid.org/0000-0001-6862-6964"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Hui Zeng","raw_affiliation_strings":["Department of Computing, The Hong Kong Polytechnic University, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computing, The Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lida Li","orcid":"https://orcid.org/0000-0001-9386-194X"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Lida Li","raw_affiliation_strings":["Department of Computing, The Hong Kong Polytechnic University, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computing, The Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zisheng Cao","orcid":"https://orcid.org/0000-0002-7037-8039"},"institutions":[{"id":"https://openalex.org/I4210148944","display_name":"D\u00e0-Ji\u0101ng Innovations Science and Technology (China)","ror":"https://ror.org/04fmkfb67","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210148944"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zisheng Cao","raw_affiliation_strings":["Camera Group of DJI Innovations Company, Ltd, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Camera Group of DJI Innovations Company, Ltd, Shenzhen, China","institution_ids":["https://openalex.org/I4210148944"]}]},{"author_position":"last","author":{"id":null,"display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0002-2078-4215"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["Department of Computing, The Hong Kong Polytechnic University, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computing, The Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":1.0793,"has_fulltext":false,"cited_by_count":37,"citation_normalized_percentile":{"value":0.79198803,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"44","issue":"3","first_page":"1304","last_page":"1319"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.25920000672340393,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.25920000672340393,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.22010000050067902,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.19760000705718994,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7315999865531921},{"id":"https://openalex.org/keywords/cropping","display_name":"Cropping","score":0.6916999816894531},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.6244999766349792},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.6128000020980835},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5727999806404114},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.4431999921798706},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.3991999924182892},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.3855000138282776}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7383999824523926},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7315999865531921},{"id":"https://openalex.org/C13558536","wikidata":"https://www.wikidata.org/wiki/Q785116","display_name":"Cropping","level":3,"score":0.6916999816894531},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.6244999766349792},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.6128000020980835},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5727999806404114},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5497999787330627},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4846000075340271},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.4431999921798706},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3991999924182892},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3855000138282776},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.37610000371932983},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3409999907016754},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.3206999897956848},{"id":"https://openalex.org/C63099799","wikidata":"https://www.wikidata.org/wiki/Q17147001","display_name":"Image texture","level":4,"score":0.3034000098705292},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.30090001225471497},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.298799991607666},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C205372480","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"Image resolution","level":2,"score":0.2678000032901764},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2565000057220459},{"id":"https://openalex.org/C3115412","wikidata":"https://www.wikidata.org/wiki/Q1194708","display_name":"Bitmap","level":2,"score":0.250900000333786}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019985","descriptor_name":"Benchmarking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019985","descriptor_name":"Benchmarking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019985","descriptor_name":"Benchmarking","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2020.3024207","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2020.3024207","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:32931429","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/32931429","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1498238238","https://openalex.org/W1849277567","https://openalex.org/W1975521048","https://openalex.org/W1997095443","https://openalex.org/W2001070410","https://openalex.org/W2013339738","https://openalex.org/W2023081159","https://openalex.org/W2046033161","https://openalex.org/W2060502770","https://openalex.org/W2078807908","https://openalex.org/W2082335776","https://openalex.org/W2100618994","https://openalex.org/W2103598646","https://openalex.org/W2107363596","https://openalex.org/W2116510306","https://openalex.org/W2128272608","https://openalex.org/W2142785776","https://openalex.org/W2164989680","https://openalex.org/W2165810675","https://openalex.org/W2194775991","https://openalex.org/W2417288846","https://openalex.org/W2467818129","https://openalex.org/W2529088810","https://openalex.org/W2556068545","https://openalex.org/W2575939610","https://openalex.org/W2586372171","https://openalex.org/W2754213847","https://openalex.org/W2775725209","https://openalex.org/W2798986039","https://openalex.org/W2804743778","https://openalex.org/W2883780447","https://openalex.org/W2963010685","https://openalex.org/W2963150697","https://openalex.org/W2963156339","https://openalex.org/W2963163009","https://openalex.org/W2963312801","https://openalex.org/W2964332053","https://openalex.org/W6631190155","https://openalex.org/W6631943919","https://openalex.org/W6637373629","https://openalex.org/W6684191040","https://openalex.org/W6772035322"],"related_works":[],"abstract_inverted_index":{"Image":[0],"cropping":[1,26,49,67,123,160],"aims":[2],"to":[3,113],"improve":[4],"the":[5,23,37,43,62,73,87,105,144,165],"composition":[6],"as":[7,9,36,57],"well":[8],"aesthetic":[10],"quality":[11],"of":[12,22,47,65,75,99,108,130,147,167,171,187,201],"an":[13,156],"image":[14,25,48,76,100,132],"by":[15,85],"removing":[16],"extraneous":[17],"content":[18,95],"from":[19,111],"it.":[20],"Most":[21],"existing":[24],"databases":[27],"provide":[28],"only":[29],"one":[30,205,214],"or":[31],"several":[32],"human-annotated":[33],"bounding":[34],"boxes":[35],"groundtruths,":[38],"which":[39],"can":[40,179],"hardly":[41],"reflect":[42,61],"non-uniqueness":[44],"and":[45,78,90,135,150,158,169,173,210],"flexibility":[46],"in":[50],"practice.":[51],"The":[52,217],"employed":[53],"evaluation":[54,138],"metrics":[55,139],"such":[56],"intersection-over-union":[58],"cannot":[59],"reliably":[60],"real":[63],"performance":[64,149],"a":[66,80,119,199],"model,":[68],"either.":[69],"This":[70],"work":[71],"revisits":[72],"problem":[74],"cropping,":[77],"presents":[79],"grid":[81,120],"anchor":[82,121],"based":[83,122],"formulation":[84,103],"considering":[86,164],"special":[88],"properties":[89],"requirements":[91],"(e.g.,":[92],"local":[93],"redundancy,":[94],"preservation,":[96],"aspect":[97],"ratio)":[98],"cropping.":[101],"Our":[102],"reduces":[104],"searching":[106],"space":[107],"candidate":[109],"crops":[110,129,184],"millions":[112],"no":[114],"more":[115,136],"than":[116,192],"ninety.":[117],"Consequently,":[118],"benchmark":[124],"is":[125,219],"constructed,":[126],"where":[127],"all":[128],"each":[131],"are":[133,140],"annotated":[134],"reliable":[137],"defined.":[141],"To":[142],"meet":[143],"practical":[145],"demands":[146],"robust":[148],"high":[151],"efficiency,":[152],"we":[153],"also":[154],"design":[155],"effective":[157],"lightweight":[159],"model.":[161],"By":[162],"simultaneously":[163],"region":[166,170],"interest":[168],"discard,":[172],"leveraging":[174],"multi-scale":[175],"information,":[176],"our":[177,195],"model":[178,196],"robustly":[180],"output":[181],"visually":[182],"pleasing":[183],"for":[185],"images":[186],"different":[188],"scenes.":[189],"With":[190],"less":[191],"2.5M":[193],"parameters,":[194],"runs":[197],"at":[198],"speed":[200],"200":[202],"FPS":[203,212],"on":[204,213],"single":[206],"GTX":[207],"1080Ti":[208],"GPU":[209],"12":[211],"i7-6800K":[215],"CPU.":[216],"code":[218],"available":[220],"at:":[221],"https://github.com/HuiZeng/Grid-Anchor-based-Image-Cropping-Pytorch.":[222]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2019-09-26T00:00:00"}
