{"id":"https://openalex.org/W1920142129","doi":"https://doi.org/10.1109/cvpr.2015.7298987","title":"Semantic object segmentation via detection in weakly labeled video","display_name":"Semantic object segmentation via detection in weakly labeled video","publication_year":2015,"publication_date":"2015-06-01","ids":{"openalex":"https://openalex.org/W1920142129","doi":"https://doi.org/10.1109/cvpr.2015.7298987","mag":"1920142129"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2015.7298987","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2015.7298987","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100651152","display_name":"Yu Zhang","orcid":"https://orcid.org/0000-0002-9653-3906"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yu Zhang","raw_affiliation_strings":["State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101579465","display_name":"Xiaowu Chen","orcid":"https://orcid.org/0000-0002-3976-6500"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaowu Chen","raw_affiliation_strings":["State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100783533","display_name":"Jia Li","orcid":"https://orcid.org/0000-0003-3443-4651"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jia Li","raw_affiliation_strings":["International Research Institute for Multidisciplinary Science, Beihang University","State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China"],"affiliations":[{"raw_affiliation_string":"International Research Institute for Multidisciplinary Science, Beihang University","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100337579","display_name":"Chen Wang","orcid":"https://orcid.org/0000-0002-4334-6103"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Wang","raw_affiliation_strings":["State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053599124","display_name":"Changqun Xia","orcid":"https://orcid.org/0000-0002-9594-5693"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changqun Xia","raw_affiliation_strings":["State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"State Key Laboratory of Virtual Reality Technology and Systems, School of Computer Science and Engineering, Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100651152"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":8.6103,"has_fulltext":false,"cited_by_count":77,"citation_normalized_percentile":{"value":0.98469798,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3641","last_page":"3649"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.827515721321106},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7708374261856079},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7590609788894653},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6206381916999817},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6164725422859192},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5857029557228088},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.5531139969825745},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5441641807556152},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4950815737247467},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.46532365679740906},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4552769064903259},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.44851449131965637},{"id":"https://openalex.org/keywords/segmentation-based-object-categorization","display_name":"Segmentation-based object categorization","score":0.4477512836456299}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.827515721321106},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7708374261856079},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7590609788894653},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6206381916999817},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6164725422859192},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5857029557228088},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.5531139969825745},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5441641807556152},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4950815737247467},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.46532365679740906},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4552769064903259},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.44851449131965637},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.4477512836456299},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cvpr.2015.7298987","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2015.7298987","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.912.6619","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.912.6619","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cv-foundation.org/openaccess/content_cvpr_2015/papers/Zhang_Semantic_Object_Segmentation_2015_CVPR_paper.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W44380796","https://openalex.org/W95258188","https://openalex.org/W122025198","https://openalex.org/W589665618","https://openalex.org/W1560354729","https://openalex.org/W1610707153","https://openalex.org/W1973054923","https://openalex.org/W1977545325","https://openalex.org/W1981667613","https://openalex.org/W1989348325","https://openalex.org/W2033959528","https://openalex.org/W2034740917","https://openalex.org/W2044373869","https://openalex.org/W2046382188","https://openalex.org/W2060475276","https://openalex.org/W2061202859","https://openalex.org/W2074753351","https://openalex.org/W2083597815","https://openalex.org/W2087570216","https://openalex.org/W2105297725","https://openalex.org/W2113708607","https://openalex.org/W2124351162","https://openalex.org/W2127194945","https://openalex.org/W2131720600","https://openalex.org/W2137881638","https://openalex.org/W2138682569","https://openalex.org/W2154644822","https://openalex.org/W2155598147","https://openalex.org/W2168356304","https://openalex.org/W2294631093","https://openalex.org/W3021229333","https://openalex.org/W4213060235","https://openalex.org/W4302039860","https://openalex.org/W6601799289","https://openalex.org/W6603540024","https://openalex.org/W6604983209","https://openalex.org/W6632547051","https://openalex.org/W6633569709","https://openalex.org/W6636212864"],"related_works":["https://openalex.org/W3144569342","https://openalex.org/W2185902295","https://openalex.org/W2945274617","https://openalex.org/W2103507220","https://openalex.org/W2055202857","https://openalex.org/W1999008862","https://openalex.org/W2371519352","https://openalex.org/W4205800335","https://openalex.org/W2386644571","https://openalex.org/W2551987074"],"abstract_inverted_index":{"Semantic":[0],"object":[1,50,65,88,117],"segmentation":[2,80,118],"in":[3,45],"video":[4,48,57],"is":[5,60],"an":[6,39],"important":[7],"step":[8],"for":[9],"large-scale":[10],"multimedia":[11],"analysis.":[12],"In":[13,52],"many":[14],"cases,":[15],"however,":[16],"semantic":[17,43,111],"objects":[18,44],"are":[19,90],"only":[20],"tagged":[21],"at":[22],"video-level,":[23],"making":[24],"them":[25],"difficult":[26],"to":[27,41,73],"be":[28],"located":[29],"and":[30,66,79,142,152],"segmented.":[31],"To":[32],"address":[33],"this":[34,36],"problem,":[35],"paper":[37],"proposes":[38],"approach":[40],"segment":[42],"weakly":[46],"labeled":[47],"via":[49],"detection.":[51],"our":[53,148],"approach,":[54],"a":[55,75,95],"novel":[56],"segmentation-by-detection":[58],"framework":[59],"proposed,":[61],"which":[62],"first":[63],"incorporates":[64],"region":[67],"detectors":[68],"pre-trained":[69],"on":[70,83,139],"still":[71],"images":[72],"generate":[74],"set":[76],"of":[77,110,129,135],"detection":[78],"proposals.":[81],"Based":[82],"the":[84,116,121,126,132],"noisy":[85],"proposals,":[86],"several":[87],"tracks":[89,105],"then":[91],"initialized":[92],"by":[93,124],"solving":[94],"joint":[96],"binary":[97],"optimization":[98],"problem":[99],"with":[100],"min-cost":[101],"flow.":[102],"As":[103],"such":[104],"actually":[106],"provide":[107],"rough":[108],"configurations":[109],"objects,":[112],"we":[113],"thus":[114],"refine":[115],"while":[119],"preserving":[120],"spatiotemporal":[122],"consistency":[123],"inferring":[125],"shape":[127],"likelihoods":[128],"pixels":[130],"from":[131],"statistical":[133],"information":[134],"tracks.":[136],"Experimental":[137],"results":[138],"Youtube-Objects":[140],"dataset":[141,145],"SegTrack":[143],"v2":[144],"demonstrate":[146],"that":[147],"method":[149],"outperforms":[150],"state-of-the-arts":[151],"shows":[153],"impressive":[154],"results.":[155]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":21},{"year":2016,"cited_by_count":16},{"year":2015,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
