{"id":"https://openalex.org/W3032921344","doi":"https://doi.org/10.1145/3372278.3390682","title":"QIK: A System for Large-Scale Image Retrieval on Everyday Scenes With Common Objects","display_name":"QIK: A System for Large-Scale Image Retrieval on Everyday Scenes With Common Objects","publication_year":2020,"publication_date":"2020-06-02","ids":{"openalex":"https://openalex.org/W3032921344","doi":"https://doi.org/10.1145/3372278.3390682","mag":"3032921344"},"language":"en","primary_location":{"id":"doi:10.1145/3372278.3390682","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3372278.3390682","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059478823","display_name":"Arun Zachariah","orcid":"https://orcid.org/0000-0002-5608-9089"},"institutions":[{"id":"https://openalex.org/I76835614","display_name":"University of Missouri","ror":"https://ror.org/02ymw8z06","country_code":"US","type":"education","lineage":["https://openalex.org/I76835614"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Arun Zachariah","raw_affiliation_strings":["University of Missouri-Columbia, Columbia, MO, USA"],"affiliations":[{"raw_affiliation_string":"University of Missouri-Columbia, Columbia, MO, USA","institution_ids":["https://openalex.org/I76835614"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079477508","display_name":"Mohamed Gharibi","orcid":null},"institutions":[{"id":"https://openalex.org/I75421653","display_name":"University of Missouri\u2013Kansas City","ror":"https://ror.org/01w0d5g70","country_code":"US","type":"education","lineage":["https://openalex.org/I75421653"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohamed Gharibi","raw_affiliation_strings":["University of Missouri-Kansas City, Kansas City, MO, USA"],"affiliations":[{"raw_affiliation_string":"University of Missouri-Kansas City, Kansas City, MO, USA","institution_ids":["https://openalex.org/I75421653"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087950601","display_name":"Praveen Rao","orcid":"https://orcid.org/0000-0002-1859-0438"},"institutions":[{"id":"https://openalex.org/I76835614","display_name":"University of Missouri","ror":"https://ror.org/02ymw8z06","country_code":"US","type":"education","lineage":["https://openalex.org/I76835614"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Praveen Rao","raw_affiliation_strings":["University of Missouri-Columbia, Columbia, MO, USA"],"affiliations":[{"raw_affiliation_string":"University of Missouri-Columbia, Columbia, MO, USA","institution_ids":["https://openalex.org/I76835614"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5059478823"],"corresponding_institution_ids":["https://openalex.org/I76835614"],"apc_list":null,"apc_paid":null,"fwci":0.2931,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.55264838,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"126","last_page":"135"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.851158857345581},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7505447268486023},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6842666864395142},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.6054747104644775},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.5763687491416931},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5736501812934875},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.5663415193557739},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5344658493995667},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5233882069587708},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.49387747049331665},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44640421867370605},{"id":"https://openalex.org/keywords/tree-structure","display_name":"Tree structure","score":0.4448099434375763},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4438605308532715},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.375122606754303},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.15867763757705688}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.851158857345581},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7505447268486023},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6842666864395142},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6054747104644775},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.5763687491416931},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5736501812934875},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.5663415193557739},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5344658493995667},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5233882069587708},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49387747049331665},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44640421867370605},{"id":"https://openalex.org/C163797641","wikidata":"https://www.wikidata.org/wiki/Q2067937","display_name":"Tree structure","level":3,"score":0.4448099434375763},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4438605308532715},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.375122606754303},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.15867763757705688},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3372278.3390682","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3372278.3390682","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8199999928474426}],"awards":[{"id":"https://openalex.org/G7621532285","display_name":null,"funder_award_id":"1747751","funder_id":"https://openalex.org/F4320315254","funder_display_name":"Innovative Research Group Project of the National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320315254","display_name":"Innovative Research Group Project of the National Natural Science Foundation of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W204268067","https://openalex.org/W639708223","https://openalex.org/W1556531089","https://openalex.org/W1976794880","https://openalex.org/W1978478796","https://openalex.org/W1981857004","https://openalex.org/W1984309565","https://openalex.org/W2028509346","https://openalex.org/W2097117768","https://openalex.org/W2119605622","https://openalex.org/W2141362318","https://openalex.org/W2148809531","https://openalex.org/W2151103935","https://openalex.org/W2185175083","https://openalex.org/W2187250581","https://openalex.org/W2250861254","https://openalex.org/W2295537791","https://openalex.org/W2340690086","https://openalex.org/W2463955103","https://openalex.org/W2884354140","https://openalex.org/W2912083425","https://openalex.org/W2912380520","https://openalex.org/W2913059114","https://openalex.org/W2963588253","https://openalex.org/W2964157791","https://openalex.org/W4214540501","https://openalex.org/W4238358009","https://openalex.org/W4249142012","https://openalex.org/W4249852273","https://openalex.org/W4297683907"],"related_works":["https://openalex.org/W579810227","https://openalex.org/W2952780262","https://openalex.org/W2979495269","https://openalex.org/W51364034","https://openalex.org/W2050340680","https://openalex.org/W2898073868","https://openalex.org/W1700641177","https://openalex.org/W4284663758","https://openalex.org/W2953384362","https://openalex.org/W1568205884"],"abstract_inverted_index":{"In":[0,198],"this":[1,199],"paper,":[2],"we":[3],"propose":[4],"a":[5,37,122,126,129,160],"system":[6,43,57,217,233],"for":[7,52,244],"large-scale":[8,245],"image":[9,34,53,84,98,191,246],"retrieval":[10],"on":[11,155,177,184,218],"everyday":[12,67,224],"scenes":[13,225],"with":[14],"common":[15,227],"objects":[16,64,74,95,186],"by":[17,48,110],"leveraging":[18],"advances":[19],"in":[20,65,75,85,96,121,188,238],"deep":[21,49,101,137],"learning":[22,102,138],"and":[23,93,108,119,139,153,196,229],"natural":[24],"language":[25],"processing":[26],"(NLP).":[27],"Unlike":[28],"recent":[29],"state-of-the-art":[30,100,236],"approaches":[31],"that":[32,231],"extract":[33],"features":[35],"from":[36],"convolutional":[38],"neural":[39,50],"network":[40],"(CNN),":[41],"our":[42,216,232],"exploits":[44],"the":[45,61,72,76,86,97,156,172,178,189,201,205,208,213,219],"predictions":[46],"made":[47],"networks":[51],"understanding":[54],"tasks.":[55],"Our":[56],"aims":[58],"to":[59,158],"capture":[60],"relationships":[62],"between":[63],"an":[66,147],"scene":[68],"rather":[69],"than":[70],"just":[71],"individual":[73],"scene.":[77],"It":[78],"works":[79],"as":[80],"follows:":[81],"For":[82],"each":[83],"database,":[87],"it":[88],"generates":[89],"most":[90],"probable":[91],"captions":[92,105],"detects":[94],"using":[99,113,136,171],"models.":[103],"The":[104],"are":[106,117,169],"parsed":[107,140],"represented":[109],"tree":[111,144,179],"structures":[112],"NLP":[114],"techniques.":[115],"These":[116],"stored":[118],"indexed":[120],"database":[123,157],"system.":[124],"When":[125],"user":[127],"poses":[128],"query":[130,150,182,190],"image,":[131],"its":[132,142],"caption":[133],"is":[134,151],"generated":[135],"into":[141],"corresponding":[143],"structures.":[145,180],"Then":[146],"optimized":[148],"tree-pattern":[149],"constructed":[152],"executed":[154],"retrieve":[159],"set":[161],"of":[162,207,215,240],"candidate":[163,167],"images.":[164],"Finally,":[165],"these":[166],"images":[168],"ranked":[170],"tree-edit":[173],"distance":[174],"metric":[175],"computed":[176],"A":[181],"based":[183],"only":[185],"detected":[187,209],"can":[192,234],"also":[193],"be":[194],"formulated":[195],"executed.":[197],"case,":[200],"ranking":[202],"scheme":[203],"uses":[204],"probabilities":[206],"objects.":[210],"We":[211],"evaluated":[212],"performance":[214],"Microsoft":[220],"COCO":[221],"dataset":[222],"containing":[223],"(with":[226],"objects)":[228],"observed":[230],"outperform":[235],"techniques":[237],"terms":[239],"mean":[241],"average":[242],"precision":[243],"retrieval.":[247]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
