{"id":"https://openalex.org/W4403791444","doi":"https://doi.org/10.1145/3664647.3680925","title":"LOVD: Large-and-Open Vocabulary Object Detection","display_name":"LOVD: Large-and-Open Vocabulary Object Detection","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403791444","doi":"https://doi.org/10.1145/3664647.3680925"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680925","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680925","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113006444","display_name":"Shiyao Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shiyu Tang","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100845264","display_name":"Zhaofan Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaofan Luo","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100398548","display_name":"Yifan Wang","orcid":"https://orcid.org/0000-0002-1911-2526"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifan Wang","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100318892","display_name":"Lijun Wang","orcid":"https://orcid.org/0000-0003-2538-8358"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lijun Wang","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006986293","display_name":"Huchuan Lu","orcid":"https://orcid.org/0000-0002-6668-9758"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huchuan Lu","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114255302","display_name":"Wei-Kai Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weibo Su","raw_affiliation_strings":["OPPO, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"OPPO, Shenzhen, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111401023","display_name":"Libo Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Libo Liu","raw_affiliation_strings":["OPPO, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"OPPO, Shenzhen, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5113006444"],"corresponding_institution_ids":["https://openalex.org/I27357992"],"apc_list":null,"apc_paid":null,"fwci":0.2493,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.54525662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"9321","last_page":"9329"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7605105042457581},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5642415285110474},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5614237785339355},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5437704920768738},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4639453887939453},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3581000566482544},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33219659328460693},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.21265661716461182},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.12601003050804138}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7605105042457581},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5642415285110474},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5614237785339355},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5437704920768738},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4639453887939453},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3581000566482544},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33219659328460693},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.21265661716461182},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.12601003050804138},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3680925","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680925","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.800000011920929,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2031489346","https://openalex.org/W2963936013","https://openalex.org/W3205021045","https://openalex.org/W4206811189","https://openalex.org/W4288083516","https://openalex.org/W4292828970","https://openalex.org/W4310557340","https://openalex.org/W4312424618","https://openalex.org/W4312825288","https://openalex.org/W4312956471","https://openalex.org/W4382450414","https://openalex.org/W4386076029","https://openalex.org/W4387968307","https://openalex.org/W4387969137","https://openalex.org/W4387969559","https://openalex.org/W4388189856","https://openalex.org/W4388283733","https://openalex.org/W4389888036","https://openalex.org/W4390872928","https://openalex.org/W4393150063"],"related_works":["https://openalex.org/W2349784553","https://openalex.org/W3022596247","https://openalex.org/W2601444686","https://openalex.org/W4307058054","https://openalex.org/W4292238148","https://openalex.org/W4323660495","https://openalex.org/W2385319785","https://openalex.org/W2900827440","https://openalex.org/W4292830139","https://openalex.org/W4319309705"],"abstract_inverted_index":{"Existing":[0],"open-vocabulary":[1,209],"object":[2,49],"detectors":[3,57],"require":[4],"an":[5,73],"accurate":[6],"and":[7,28,83,97,112,167,170,191,197],"compact":[8,134,153],"vocabulary":[9,24,135],"pre-defined":[10],"during":[11],"inference.":[12],"Their":[13],"performance":[14],"is":[15,188],"largely":[16],"degraded":[17],"in":[18,75,164],"real":[19,53],"scenarios":[20,54],"where":[21],"the":[22,80,107,119,123,138,143,152,158,172,183],"underlying":[23],"may":[25],"be":[26,199,214],"indeterminate":[27],"often":[29],"exponentially":[30],"large.":[31],"To":[32,89,117],"have":[33],"a":[34,43,95,133,177],"more":[35,189],"comprehensive":[36],"understanding":[37],"of":[38,63,122,142],"this":[39,91],"phenomenon,":[40],"we":[41],"propose":[42,94],"new":[44],"setting":[45],"called":[46],"Large-and-Open":[47],"Vocabulary":[48,99],"Detection,":[50],"which":[51],"simulates":[52],"by":[55,148,160],"testing":[56],"with":[58,102,202],"large":[59,125,144,194],"vocabularies":[60],"containing":[61],"thousands":[62],"unseen":[64,68],"categories.":[65],"The":[66,211],"vast":[67],"categories":[69,175],"inevitably":[70],"lead":[71],"to":[72,85,131,137,182,193,206],"increase":[74],"category":[76,120],"distractors,":[77],"severely":[78],"impeding":[79],"recognition":[81,130],"process":[82],"leading":[84],"unsatisfactory":[86],"detection":[87,174,204],"results.":[88],"address":[90],"challenge,":[92],"We":[93],"Large":[96],"Open":[98],"Detector":[100],"(LOVD)":[101],"two":[103],"core":[104],"components,":[105],"termed":[106],"Image-to-Region":[108],"Filtering":[109],"(IRF)":[110],"module":[111],"Cross-View":[113],"Verification":[114],"(CV2)":[115],"scheme.":[116],"relieve":[118],"distractors":[121],"given":[124],"vocabularies,":[126,196],"IRF":[127,159],"performs":[128],"image-level":[129],"build":[132],"relevant":[136],"image":[139],"scene":[140],"out":[141],"input":[145,195],"vocabulary,":[146],"followed":[147],"region-level":[149],"classification":[150],"upon":[151],"vocabulary.":[154],"CV2":[155],"further":[156],"enhances":[157],"conducting":[161],"image-to-region":[162],"filtering":[163],"both":[165],"global":[166],"local":[168],"views":[169],"produces":[171],"final":[173],"through":[176],"two-branch":[178],"voting":[179],"mechanism.":[180],"Compared":[181],"prior":[184],"works,":[185],"our":[186],"LOVD":[187],"scalable":[190],"robust":[192],"can":[198,213],"seamlessly":[200],"integrated":[201],"predominant":[203],"methods":[205],"improve":[207],"their":[208],"performance.":[210],"code":[212],"found":[215],"at":[216],"https://github.com/Altria-luo/LOVD.":[217]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
