{"id":"https://openalex.org/W4392490746","doi":"https://doi.org/10.48550/arxiv.2403.01214","title":"Boosting Box-supervised Instance Segmentation with Pseudo Depth","display_name":"Boosting Box-supervised Instance Segmentation with Pseudo Depth","publication_year":2024,"publication_date":"2024-03-02","ids":{"openalex":"https://openalex.org/W4392490746","doi":"https://doi.org/10.48550/arxiv.2403.01214"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2403.01214","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.01214","pdf_url":"https://arxiv.org/pdf/2403.01214","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2403.01214","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101978641","display_name":"Xinyi Yu","orcid":"https://orcid.org/0000-0002-5268-7401"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yu, Xinyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113134790","display_name":"Ling Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Ling","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108638480","display_name":"Pengtao Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Pengtao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100353596","display_name":"Hao Chen","orcid":"https://orcid.org/0000-0002-8400-3780"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046508099","display_name":"Bo Li","orcid":"https://orcid.org/0000-0002-1415-4444"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Bo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083453098","display_name":"Lin Wu","orcid":"https://orcid.org/0000-0001-6119-058X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Lin Yuanbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101893352","display_name":"Linlin Ou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ou, Linlin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101978641"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9416999816894531,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12549","display_name":"Image and Object Detection Techniques","score":0.9210000038146973,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.8126937747001648},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7314474582672119},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6265767812728882},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5377026200294495},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4417562782764435},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3876502811908722}],"concepts":[{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.8126937747001648},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7314474582672119},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6265767812728882},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5377026200294495},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4417562782764435},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3876502811908722}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2403.01214","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.01214","pdf_url":"https://arxiv.org/pdf/2403.01214","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2403.01214","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2403.01214","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2403.01214","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2403.01214","pdf_url":"https://arxiv.org/pdf/2403.01214","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392490746.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3082059448","https://openalex.org/W4313640622","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474"],"abstract_inverted_index":{"The":[0,180],"realm":[1],"of":[2,24,59],"Weakly":[3],"Supervised":[4],"Instance":[5],"Segmentation":[6],"(WSIS)":[7],"under":[8],"box":[9,25,166],"supervision":[10,26,151],"has":[11],"garnered":[12],"substantial":[13],"attention,":[14],"showcasing":[15],"remarkable":[16],"advancements":[17],"in":[18,29,146],"recent":[19],"years.":[20],"However,":[21],"the":[22,42,56,60,90,95,111,119,136,143,147,154,157,161,168],"limitations":[23],"become":[27],"apparent":[28],"its":[30,66,128],"inability":[31],"to":[32,97,121,130,152],"furnish":[33],"effective":[34],"information":[35,134],"for":[36,164],"distinguishing":[37],"foreground":[38,155],"from":[39,156],"background":[40],"within":[41],"specified":[43],"target":[44],"box.":[45],"This":[46,115],"research":[47],"addresses":[48],"this":[49],"challenge":[50],"by":[51,68],"introducing":[52],"pseudo-depth":[53,75],"maps":[54,76],"into":[55,110],"training":[57,148],"process":[58,149],"instance":[61,137],"segmentation":[62,138],"network,":[63],"thereby":[64],"boosting":[65],"performance":[67],"capturing":[69],"depth":[70,83,99,107,173],"differences":[71],"between":[72],"instances.":[73],"These":[74],"are":[77,86],"generated":[78,145],"using":[79],"a":[80,106],"readily":[81],"available":[82],"predictor":[84],"and":[85,125,188],"not":[87],"necessary":[88],"during":[89,135],"inference":[91],"stage.":[92],"To":[93],"enable":[94],"network":[96,120],"discern":[98],"features":[100],"when":[101],"predicting":[102],"masks,":[103],"we":[104,171],"integrate":[105],"prediction":[108,113],"layer":[109],"mask":[112,144,163],"head.":[114],"innovative":[116],"approach":[117],"empowers":[118],"simultaneously":[122],"predict":[123],"masks":[124],"depth,":[126],"enhancing":[127],"ability":[129],"capture":[131],"nuanced":[132],"depth-related":[133],"process.":[139],"We":[140],"further":[141],"utilize":[142],"as":[150,175],"distinguish":[153],"background.":[158],"When":[159],"selecting":[160],"best":[162],"each":[165],"through":[167],"Hungarian":[169],"algorithm,":[170],"use":[172],"consistency":[174],"one":[176],"calculation":[177],"cost":[178],"item.":[179],"proposed":[181],"method":[182],"achieves":[183],"significant":[184],"improvements":[185],"on":[186],"Cityscapes":[187],"COCO":[189],"dataset.":[190]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
