{"id":"https://openalex.org/W1998299325","doi":"https://doi.org/10.1109/cvpr.2015.7298982","title":"Watch and learn: Semi-supervised learning of object detectors from videos","display_name":"Watch and learn: Semi-supervised learning of object detectors from videos","publication_year":2015,"publication_date":"2015-06-01","ids":{"openalex":"https://openalex.org/W1998299325","doi":"https://doi.org/10.1109/cvpr.2015.7298982","mag":"1998299325"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2015.7298982","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2015.7298982","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000623592","display_name":"Ishan Misra","orcid":"https://orcid.org/0000-0001-7708-7261"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ishan Misra","raw_affiliation_strings":["Robotics Institute, Carnegie Mellon University","Robotics Institute, Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101614443","display_name":"Abhinav Shrivastava","orcid":"https://orcid.org/0000-0001-8928-8554"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abhinav Shrivastava","raw_affiliation_strings":["Robotics Institute, Carnegie Mellon University","Robotics Institute, Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075246991","display_name":"Martial Hebert","orcid":"https://orcid.org/0000-0003-4566-5930"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Martial Hebert","raw_affiliation_strings":["Robotics Institute, Carnegie Mellon University","Robotics Institute, Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5000623592"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":6.4434,"has_fulltext":false,"cited_by_count":98,"citation_normalized_percentile":{"value":0.97708619,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3593","last_page":"3602"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7979711294174194},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.7112276554107666},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6817375421524048},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6323373317718506},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.564681351184845},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.488061785697937},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4849303066730499},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4839901924133301},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.47753942012786865},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.4758836328983307},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.46722280979156494},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4636228382587433},{"id":"https://openalex.org/keywords/method","display_name":"Method","score":0.4582272469997406},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4567798376083374},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.42809727787971497},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.4173424541950226},{"id":"https://openalex.org/keywords/learning-object","display_name":"Learning object","score":0.4113450050354004},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32166534662246704},{"id":"https://openalex.org/keywords/object-oriented-programming","display_name":"Object-oriented programming","score":0.12862750887870789}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7979711294174194},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.7112276554107666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6817375421524048},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6323373317718506},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.564681351184845},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.488061785697937},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4849303066730499},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4839901924133301},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.47753942012786865},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.4758836328983307},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.46722280979156494},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4636228382587433},{"id":"https://openalex.org/C512554520","wikidata":"https://www.wikidata.org/wiki/Q815844","display_name":"Method","level":3,"score":0.4582272469997406},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4567798376083374},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.42809727787971497},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.4173424541950226},{"id":"https://openalex.org/C2779542340","wikidata":"https://www.wikidata.org/wiki/Q1062461","display_name":"Learning object","level":2,"score":0.4113450050354004},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32166534662246704},{"id":"https://openalex.org/C73752529","wikidata":"https://www.wikidata.org/wiki/Q79872","display_name":"Object-oriented programming","level":2,"score":0.12862750887870789},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr.2015.7298982","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2015.7298982","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6800000071525574}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":73,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W82130502","https://openalex.org/W88868203","https://openalex.org/W1506536088","https://openalex.org/W1565206031","https://openalex.org/W1601728199","https://openalex.org/W1659581753","https://openalex.org/W1807914171","https://openalex.org/W1861492603","https://openalex.org/W1922288304","https://openalex.org/W1964763677","https://openalex.org/W1973054923","https://openalex.org/W1982428585","https://openalex.org/W1989684337","https://openalex.org/W1990342138","https://openalex.org/W2016053056","https://openalex.org/W2016135469","https://openalex.org/W2035652042","https://openalex.org/W2037227137","https://openalex.org/W2045724293","https://openalex.org/W2056933870","https://openalex.org/W2062671023","https://openalex.org/W2070927566","https://openalex.org/W2074753351","https://openalex.org/W2079057609","https://openalex.org/W2081613070","https://openalex.org/W2088049833","https://openalex.org/W2098941887","https://openalex.org/W2102605133","https://openalex.org/W2102689555","https://openalex.org/W2105297725","https://openalex.org/W2106229755","https://openalex.org/W2108598243","https://openalex.org/W2115579991","https://openalex.org/W2116946038","https://openalex.org/W2118897962","https://openalex.org/W2122457239","https://openalex.org/W2124211486","https://openalex.org/W2128715914","https://openalex.org/W2129305389","https://openalex.org/W2133348086","https://openalex.org/W2136475381","https://openalex.org/W2142996775","https://openalex.org/W2150066425","https://openalex.org/W2154683974","https://openalex.org/W2160160833","https://openalex.org/W2162813810","https://openalex.org/W2163292664","https://openalex.org/W2163605009","https://openalex.org/W2167090521","https://openalex.org/W2168356304","https://openalex.org/W2169177311","https://openalex.org/W2171243491","https://openalex.org/W2295262250","https://openalex.org/W2296526710","https://openalex.org/W2308045930","https://openalex.org/W2546643512","https://openalex.org/W3021229333","https://openalex.org/W3022547535","https://openalex.org/W4256379134","https://openalex.org/W4376522650","https://openalex.org/W6603374121","https://openalex.org/W6603540024","https://openalex.org/W6603613150","https://openalex.org/W6637207276","https://openalex.org/W6638399501","https://openalex.org/W6639102338","https://openalex.org/W6664576054","https://openalex.org/W6675547039","https://openalex.org/W6675954300","https://openalex.org/W6676297131","https://openalex.org/W6678569274","https://openalex.org/W6684191040"],"related_works":["https://openalex.org/W1451354128","https://openalex.org/W2082067302","https://openalex.org/W2559114496","https://openalex.org/W3177669699","https://openalex.org/W2145256756","https://openalex.org/W2533037550","https://openalex.org/W2765190739","https://openalex.org/W4389544072","https://openalex.org/W1502661168","https://openalex.org/W1566031736"],"abstract_inverted_index":{"We":[0,14,33],"present":[1],"a":[2,17,77,132],"semi-supervised":[3,45],"approach":[4,53,124],"that":[5],"localizes":[6],"multiple":[7,84,102],"unknown":[8],"object":[9,31,38,61,85,103,146],"instances":[10,86,104],"in":[11,63,75,87],"long":[12],"videos.":[13],"start":[15],"with":[16],"handful":[18],"of":[19,28,30,59,71,90,113,122,134],"labeled":[20,129],"boxes":[21],"and":[22,25,40,48,141],"iteratively":[23],"learn":[24],"label":[26],"hundreds":[27],"thousands":[29],"instances.":[32],"propose":[34],"criteria":[35],"for":[36,42],"reliable":[37],"detection":[39],"tracking":[41],"constraining":[43],"the":[44,111,114,120,127],"learning":[46],"process":[47],"minimizing":[49],"semantic":[50],"drift.":[51],"Our":[52],"does":[54],"not":[55,100],"assume":[56],"exhaustive":[57],"labeling":[58],"each":[60],"instance":[62],"any":[64,68],"single":[65],"frame,":[66],"or":[67,107],"explicit":[69],"annotation":[70],"negative":[72],"data.":[73],"Working":[74],"such":[76],"generic":[78],"setting":[79],"allow":[80],"us":[81],"to":[82,143],"tackle":[83],"video,":[88,106],"many":[89],"which":[91],"are":[92],"static.":[93],"In":[94],"contrast,":[95],"existing":[96],"approaches":[97],"either":[98],"do":[99],"consider":[101],"per":[105],"rely":[108],"heavily":[109],"on":[110,131],"motion":[112],"objects":[115],"present.":[116],"The":[117],"experiments":[118],"demonstrate":[119],"effectiveness":[121],"our":[123],"by":[125],"evaluating":[126],"automatically":[128],"data":[130],"variety":[133],"metrics":[135],"like":[136],"quality,":[137],"coverage":[138],"(recall),":[139],"diversity,":[140],"relevance":[142],"training":[144],"an":[145],"detector.":[147]},"counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":11},{"year":2021,"cited_by_count":17},{"year":2020,"cited_by_count":16},{"year":2019,"cited_by_count":11},{"year":2018,"cited_by_count":11},{"year":2017,"cited_by_count":12},{"year":2016,"cited_by_count":9},{"year":2015,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
