{"id":"https://openalex.org/W2912364477","doi":"https://doi.org/10.1109/bigdata.2018.8621935","title":"Fast Bag-Of-Words Candidate Selection in Content-Based Instance Retrieval Systems","display_name":"Fast Bag-Of-Words Candidate Selection in Content-Based Instance Retrieval Systems","publication_year":2018,"publication_date":"2018-12-01","ids":{"openalex":"https://openalex.org/W2912364477","doi":"https://doi.org/10.1109/bigdata.2018.8621935","mag":"2912364477"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2018.8621935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2018.8621935","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015117459","display_name":"Micha\u0142 Siedlaczek","orcid":"https://orcid.org/0000-0002-9168-0851"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Michal Siedlaczek","raw_affiliation_strings":["Tandon School of Engineering, New York University, Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Tandon School of Engineering, New York University, Brooklyn, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100341321","display_name":"Qi Wang","orcid":"https://orcid.org/0000-0002-7028-4956"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qi Wang","raw_affiliation_strings":["Tandon School of Engineering, New York University, Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Tandon School of Engineering, New York University, Brooklyn, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082130243","display_name":"Yen\u2010Yu Chen","orcid":"https://orcid.org/0000-0002-2920-8871"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yen-Yu Chen","raw_affiliation_strings":["Blippar, Inc., Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Blippar, Inc., Mountain View, CA, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074323303","display_name":"Torsten Suel","orcid":"https://orcid.org/0000-0002-8324-980X"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Torsten Suel","raw_affiliation_strings":["Tandon School of Engineering, New York University, Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Tandon School of Engineering, New York University, Brooklyn, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5015117459"],"corresponding_institution_ids":["https://openalex.org/I57206974"],"apc_list":null,"apc_paid":null,"fwci":0.1045,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.48750776,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"821","last_page":"830"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8505716919898987},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.7067773342132568},{"id":"https://openalex.org/keywords/inverted-index","display_name":"Inverted index","score":0.678513765335083},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6340991258621216},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.5471580624580383},{"id":"https://openalex.org/keywords/visual-word","display_name":"Visual Word","score":0.5069830417633057},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.47173061966896057},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.4521874487400055},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4183098077774048},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.4147057831287384},{"id":"https://openalex.org/keywords/selection-algorithm","display_name":"Selection algorithm","score":0.4131251871585846},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3016563057899475},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.29745161533355713},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.295063853263855}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8505716919898987},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.7067773342132568},{"id":"https://openalex.org/C130590232","wikidata":"https://www.wikidata.org/wiki/Q1671754","display_name":"Inverted index","level":3,"score":0.678513765335083},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6340991258621216},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.5471580624580383},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.5069830417633057},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.47173061966896057},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.4521874487400055},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4183098077774048},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.4147057831287384},{"id":"https://openalex.org/C2775973920","wikidata":"https://www.wikidata.org/wiki/Q3252726","display_name":"Selection algorithm","level":3,"score":0.4131251871585846},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3016563057899475},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.29745161533355713},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.295063853263855},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2018.8621935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2018.8621935","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W1481738430","https://openalex.org/W1541459201","https://openalex.org/W1595303882","https://openalex.org/W1615295117","https://openalex.org/W1672197616","https://openalex.org/W1677409904","https://openalex.org/W1686810756","https://openalex.org/W1897550784","https://openalex.org/W1973435495","https://openalex.org/W1973520416","https://openalex.org/W1980344365","https://openalex.org/W1986482242","https://openalex.org/W1991360400","https://openalex.org/W1997365529","https://openalex.org/W2000246295","https://openalex.org/W2000431947","https://openalex.org/W2016078760","https://openalex.org/W2039051707","https://openalex.org/W2041517999","https://openalex.org/W2046144220","https://openalex.org/W2065472179","https://openalex.org/W2066636486","https://openalex.org/W2086649520","https://openalex.org/W2097117768","https://openalex.org/W2108079923","https://openalex.org/W2123229215","https://openalex.org/W2124386111","https://openalex.org/W2128017662","https://openalex.org/W2134195052","https://openalex.org/W2134557242","https://openalex.org/W2135050452","https://openalex.org/W2138662031","https://openalex.org/W2141362318","https://openalex.org/W2148809531","https://openalex.org/W2154610494","https://openalex.org/W2158102958","https://openalex.org/W2160484851","https://openalex.org/W2162915993","https://openalex.org/W2163605009","https://openalex.org/W2163652601","https://openalex.org/W2165558283","https://openalex.org/W2194775991","https://openalex.org/W2234701313","https://openalex.org/W2307814545","https://openalex.org/W2342707026","https://openalex.org/W2344779122","https://openalex.org/W2461086877","https://openalex.org/W2499468060","https://openalex.org/W2586017539","https://openalex.org/W2666600683","https://openalex.org/W2740817677","https://openalex.org/W2771723090","https://openalex.org/W2912856763","https://openalex.org/W2963640793","https://openalex.org/W3106250896","https://openalex.org/W4230511558","https://openalex.org/W6628919034","https://openalex.org/W6632397832","https://openalex.org/W6635487554","https://openalex.org/W6636555507","https://openalex.org/W6636955212","https://openalex.org/W6637373629","https://openalex.org/W6637400245","https://openalex.org/W6643393412","https://openalex.org/W6684191040","https://openalex.org/W6724291978","https://openalex.org/W6758526203","https://openalex.org/W6785652829"],"related_works":["https://openalex.org/W2063218608","https://openalex.org/W4386105885","https://openalex.org/W2071180033","https://openalex.org/W2184288218","https://openalex.org/W2947282851","https://openalex.org/W2374066281","https://openalex.org/W4387423606","https://openalex.org/W2147874738","https://openalex.org/W2036058638","https://openalex.org/W2513891871"],"abstract_inverted_index":{"Many":[0],"content-based":[1,101],"image":[2,18,65],"search":[3,118],"and":[4,30,137,148,179,184,208,236],"instance":[5,102,132,160],"retrieval":[6,103,161,201],"systems":[7],"implement":[8],"bag-of-visual-words":[9],"strategies":[10],"for":[11,79,97,116,131],"candidate":[12,47,98],"selection.":[13],"Visual":[14],"processing":[15,41,75],"of":[16,22,44,60,93,123,176,192,230],"an":[17,37,45,198],"results":[19],"in":[20,85,100,150,167,181],"hundreds":[21],"visual":[23],"words":[24,32],"that":[25,50,127,203,224],"make":[26],"up":[27,212],"a":[28,157],"document,":[29],"these":[31],"are":[33,121,140],"used":[34],"to":[35,89,213,226,245],"build":[36],"inverted":[38,53],"index.":[39],"Query":[40],"then":[42],"consists":[43],"initial":[46,68],"selection":[48,99],"phase":[49,69,115],"queries":[51,180],"the":[52,61,91,144,151,173,182,190,217,227,231,242],"index,":[54],"followed":[55],"by":[56],"more":[57],"complex":[58],"reranking":[59],"candidates":[62],"using":[63],"various":[64],"features.":[66],"The":[67],"typically":[70],"uses":[71],"disjunctive":[72,94],"top-k":[73,95],"query":[74,138],"algorithms":[76],"originally":[77],"proposed":[78],"searching":[80],"text":[81,193],"collections.":[82],"Our":[83],"objective":[84],"this":[86,114,129,165],"paper":[87],"is":[88],"optimize":[90],"performance":[92,249],"computation":[96],"systems.":[104],"While":[105],"there":[106],"has":[107],"been":[108],"extensive":[109],"previous":[110],"work":[111,126],"on":[112],"optimizing":[113],"textual":[117,152],"engines,":[119],"we":[120,163,171,196,222],"unaware":[122],"any":[124,247],"published":[125],"studies":[128],"problem":[130],"retrieval,":[133],"where":[134],"both":[135],"index":[136,177],"data":[139,155],"quite":[141],"different":[142,228],"from":[143,156,189,241],"distributions":[145],"commonly":[146],"found":[147],"exploited":[149],"case.":[153],"Using":[154],"commercial":[158],"large-scale":[159],"system,":[162,183],"address":[164],"challenge":[166],"three":[168],"steps.":[169],"First,":[170],"analyze":[172],"quantitative":[174],"properties":[175,229],"structures":[178],"discuss":[185],"how":[186],"they":[187],"differ":[188],"case":[191],"retrieval.":[194],"Second,":[195],"describe":[197],"optimized":[199],"term-at-a-time":[200,207],"strategy":[202],"significantly":[204],"outperforms":[205],"baseline":[206],"document-at-a-time":[209],"strategies,":[210],"achieving":[211],"66%":[214],"speed-up":[215],"over":[216],"most":[218],"efficient":[219],"baseline.":[220],"Finally,":[221],"show":[223],"due":[225],"data,":[232],"several":[233],"common":[234],"safe":[235],"unsafe":[237],"early":[238],"termination":[239],"techniques":[240],"literature":[243],"fail":[244],"provide":[246],"significant":[248],"benefits.":[250]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
