{"id":"https://openalex.org/W3180266489","doi":"https://doi.org/10.1145/3474085.3475530","title":"Towards Accurate Localization by Instance Search","display_name":"Towards Accurate Localization by Instance Search","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3180266489","doi":"https://doi.org/10.1145/3474085.3475530","mag":"3180266489"},"language":"en","primary_location":{"id":"doi:10.1145/3474085.3475530","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475530","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2107.05005","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yi-Geng Hong","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yi-Geng Hong","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hui-Chu Xiao","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui-Chu Xiao","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"last","author":{"id":null,"display_name":"Wan-Lei Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wan-Lei Zhao","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I191208505"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07729843,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"3807","last_page":"3815"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.7218999862670898},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6459000110626221},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5094000101089478},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5001000165939331},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4708000123500824},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.45590001344680786},{"id":"https://openalex.org/keywords/viola\u2013jones-object-detection-framework","display_name":"Viola\u2013Jones object detection framework","score":0.41019999980926514}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7336999773979187},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.7218999862670898},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6660000085830688},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6459000110626221},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5759999752044678},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5094000101089478},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5001000165939331},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4708000123500824},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.45590001344680786},{"id":"https://openalex.org/C182521987","wikidata":"https://www.wikidata.org/wiki/Q2493877","display_name":"Viola\u2013Jones object detection framework","level":5,"score":0.41019999980926514},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.4077000021934509},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.32679998874664307},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.3260999917984009},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.31060001254081726},{"id":"https://openalex.org/C71681937","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object-class detection","level":5,"score":0.27720001339912415},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26159998774528503},{"id":"https://openalex.org/C143724316","wikidata":"https://www.wikidata.org/wiki/Q312468","display_name":"Series (stratigraphy)","level":2,"score":0.25369998812675476}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3474085.3475530","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475530","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2107.05005","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2107.05005","pdf_url":"https://arxiv.org/pdf/2107.05005","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2107.05005","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2107.05005","pdf_url":"https://arxiv.org/pdf/2107.05005","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8375933051","display_name":null,"funder_award_id":"61972326","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1861492603","https://openalex.org/W1999478155","https://openalex.org/W2031489346","https://openalex.org/W2040002737","https://openalex.org/W2117539524","https://openalex.org/W2126302311","https://openalex.org/W2133324800","https://openalex.org/W2158592639","https://openalex.org/W2194775991","https://openalex.org/W2248800885","https://openalex.org/W2295537791","https://openalex.org/W2494236530","https://openalex.org/W2592463526","https://openalex.org/W2752782242","https://openalex.org/W2799058067","https://openalex.org/W2806070179","https://openalex.org/W2886910176","https://openalex.org/W2889081631","https://openalex.org/W2891033863","https://openalex.org/W2963037989","https://openalex.org/W2963091558","https://openalex.org/W2963436667","https://openalex.org/W2963534981","https://openalex.org/W2963603913","https://openalex.org/W2964028976","https://openalex.org/W2981398794","https://openalex.org/W2983156430","https://openalex.org/W2993991614","https://openalex.org/W2996583130","https://openalex.org/W2997616671","https://openalex.org/W3009213340","https://openalex.org/W3017351200","https://openalex.org/W3034974675","https://openalex.org/W3097651496","https://openalex.org/W6774983715"],"related_works":[],"abstract_inverted_index":{"Visual":[0],"object":[1,11,61,117,132],"localization":[2,18,62,124],"is":[3,20,56,92,134,146],"the":[4,15,23,64,75,80,95,98,101,104,116,128,138],"key":[5],"step":[6],"in":[7,100],"a":[8,52,89],"series":[9],"of":[10,40,130],"detection":[12,133],"tasks.":[13,150],"In":[14,49,120],"literature,":[16],"high":[17],"accuracy":[19],"achieved":[21],"with":[22],"mainstream":[24],"strongly":[25],"supervised":[26,44],"frameworks.":[27],"However,":[28],"such":[29],"methods":[30,45,145],"require":[31],"object-level":[32],"annotations":[33],"and":[34,82,97],"are":[35],"unable":[36],"to":[37,58,122],"detect":[38],"objects":[39],"unknown":[41],"categories.":[42],"Weakly":[43],"face":[46],"similar":[47],"difficulties.":[48],"this":[50],"paper,":[51],"self-paced":[53],"learning":[54],"framework":[55,73],"proposed":[57,72],"achieve":[59],"accurate":[60],"on":[63,125,148],"rank":[65,102],"list":[66],"returned":[67],"by":[68],"instance":[69,77,91,107,126],"search.":[70],"The":[71],"mines":[74],"target":[76,105],"gradually":[78],"from":[79],"queries":[81],"their":[83],"corresponding":[84],"top-ranked":[85],"search":[86],"results.":[87],"Since":[88],"common":[90],"shared":[93],"between":[94],"query":[96],"images":[99],"list,":[103],"visual":[106],"can":[108],"be":[109],"accurately":[110],"localized":[111],"even":[112],"without":[113],"knowing":[114],"what":[115],"category":[118],"is.":[119],"addition":[121],"performing":[123],"search,":[127],"issue":[129],"few-shot":[131],"also":[135],"addressed":[136],"under":[137],"same":[139],"framework.":[140],"Superior":[141],"performance":[142],"over":[143],"state-of-the-art":[144],"observed":[147],"both":[149]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2021-07-19T00:00:00"}
