{"id":"https://openalex.org/W4409076560","doi":"https://doi.org/10.1109/tip.2025.3555073","title":"Object Adaptive Self-Supervised Dense Visual Pre-Training","display_name":"Object Adaptive Self-Supervised Dense Visual Pre-Training","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4409076560","doi":"https://doi.org/10.1109/tip.2025.3555073","pmid":"https://pubmed.ncbi.nlm.nih.gov/40168204"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2025.3555073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3555073","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100433666","display_name":"Yu Zhang","orcid":"https://orcid.org/0000-0003-0140-7366"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yu Zhang","raw_affiliation_strings":["School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100375754","display_name":"Tao Zhang","orcid":"https://orcid.org/0000-0001-9955-3905"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Zhang","raw_affiliation_strings":["School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015639955","display_name":"Hongyuan Zhu","orcid":"https://orcid.org/0000-0001-5177-8320"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Hongyuan Zhu","raw_affiliation_strings":["Institute for Infocomm Research (I2R), A*STAR, Fusionopolis, Singapore","A*STAR, Institute of Infocomm Research (I2R), Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research (I2R), A*STAR, Fusionopolis, Singapore","institution_ids":["https://openalex.org/I3005327000"]},{"raw_affiliation_string":"A*STAR, Institute of Infocomm Research (I2R), Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100679784","display_name":"Zihan Chen","orcid":"https://orcid.org/0000-0001-5871-7766"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zihan Chen","raw_affiliation_strings":["School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049776286","display_name":"Siya Mi","orcid":"https://orcid.org/0000-0003-1751-7076"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siya Mi","raw_affiliation_strings":["School of Cyber Science and Engineering, Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Cyber Science and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022800038","display_name":"Xi Peng","orcid":"https://orcid.org/0000-0002-5727-2790"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]},{"id":"https://openalex.org/I4210125143","display_name":"Chengdu University","ror":"https://ror.org/034z67559","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210125143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xi Peng","raw_affiliation_strings":["School of Computer Science, Sichuan University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I4210125143","https://openalex.org/I24185976"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074742406","display_name":"Xin Geng","orcid":"https://orcid.org/0000-0001-7729-0622"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Geng","raw_affiliation_strings":["School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering and the Key Laboratory of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]},{"raw_affiliation_string":"School of Computer Science and Engineering, and the Key Lab of Computer Network and Information Integration (Ministry of Education), Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100433666"],"corresponding_institution_ids":["https://openalex.org/I76569877"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04862839,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":null,"first_page":"2228","last_page":"2240"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9776999950408936,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9776999950408936,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9343000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.932200014591217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7137976288795471},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6864109039306641},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.61179518699646},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5076977014541626},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.48865869641304016},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.478836327791214},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4478493928909302},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.4473334550857544},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.41543465852737427},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.26568078994750977}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7137976288795471},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6864109039306641},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.61179518699646},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5076977014541626},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.48865869641304016},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.478836327791214},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4478493928909302},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.4473334550857544},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.41543465852737427},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.26568078994750977},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2025.3555073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3555073","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:40168204","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40168204","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2286064317","display_name":null,"funder_award_id":"S22-19016-STDP","funder_id":"https://openalex.org/F4320337495","funder_display_name":"Technology Development"}],"funders":[{"id":"https://openalex.org/F4320337495","display_name":"Technology Development","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1965301399","https://openalex.org/W2031489346","https://openalex.org/W2088049833","https://openalex.org/W2108598243","https://openalex.org/W2138621090","https://openalex.org/W2194775991","https://openalex.org/W2321533354","https://openalex.org/W2326925005","https://openalex.org/W2471138382","https://openalex.org/W2908696099","https://openalex.org/W2953231542","https://openalex.org/W2963420272","https://openalex.org/W2990873191","https://openalex.org/W3034781633","https://openalex.org/W3035524453","https://openalex.org/W3096609285","https://openalex.org/W3113317635","https://openalex.org/W3128661784","https://openalex.org/W3165924482","https://openalex.org/W3168822201","https://openalex.org/W3171007011","https://openalex.org/W3192404838","https://openalex.org/W3202407433","https://openalex.org/W4200139856","https://openalex.org/W4221166941","https://openalex.org/W4283030623","https://openalex.org/W4293677672","https://openalex.org/W4386047822","https://openalex.org/W4386083093","https://openalex.org/W4401024603","https://openalex.org/W6747899497","https://openalex.org/W6774314701","https://openalex.org/W6774670964","https://openalex.org/W6779326418","https://openalex.org/W6779997284","https://openalex.org/W6785786191","https://openalex.org/W6791437168","https://openalex.org/W6797255657","https://openalex.org/W6803893310"],"related_works":["https://openalex.org/W230091440","https://openalex.org/W2114275278","https://openalex.org/W4292830139","https://openalex.org/W4319309705","https://openalex.org/W1489511283","https://openalex.org/W2974914859","https://openalex.org/W2026565050","https://openalex.org/W2110244802","https://openalex.org/W2163728705","https://openalex.org/W949345935"],"abstract_inverted_index":{"Self-supervised":[0],"visual":[1,51],"pre-training":[2],"models":[3,16],"have":[4],"achieved":[5],"significant":[6],"success":[7],"without":[8],"employing":[9],"expensive":[10],"annotations.":[11],"Nevertheless,":[12],"most":[13,143],"of":[14,92],"these":[15],"focus":[17,84],"on":[18,54,129],"iconic":[19],"single-instance":[20],"datasets":[21,32,57],"(e.g.":[22,33],"ImageNet),":[23],"ignoring":[24],"the":[25,50,55,85,90,105,116,123],"insufficient":[26],"discriminative":[27],"representation":[28,52],"for":[29,63],"non-iconic":[30],"multi-instance":[31,56],"COCO).":[34],"In":[35,122],"this":[36],"paper,":[37],"we":[38,125],"propose":[39],"a":[40,75],"novel":[41,76],"Object":[42],"Adaptive":[43],"Dense":[44],"Pre-training":[45],"(OADP)":[46],"method":[47,117,138],"to":[48,83,88,97,149],"learn":[49,119],"directly":[53],"(e.g.,":[58,67],"PASCAL":[59,130],"VOC":[60,131],"and":[61,70,78,110,132,160],"COCO)":[62],"dense":[64],"prediction":[65],"tasks":[66],"object":[68,93,156],"detection":[69],"instance":[71,158],"segmentation).":[72],"We":[73],"present":[74],"object-aware":[77],"learning-adaptive":[79],"random":[80],"view":[81],"augmentation":[82],"contrastive":[86],"learning":[87,102],"enhance":[89],"discrimination":[91],"presentations":[94],"from":[95],"large":[96],"small":[98],"scale":[99,109],"during":[100],"different":[101,108],"stages.":[103],"Furthermore,":[104],"representations":[106],"across":[107],"resolutions":[111],"are":[112],"integrated":[113],"so":[114],"that":[115,136],"can":[118],"diverse":[120],"representations.":[121],"experiment,":[124],"evaluated":[126],"OADP":[127],"pre-trained":[128],"COCO.":[133],"Results":[134],"show":[135],"our":[137],"has":[139],"better":[140],"performances":[141],"than":[142],"existing":[144],"state-of-the-art":[145],"methods":[146],"when":[147],"transferring":[148],"various":[150],"downstream":[151],"tasks,":[152],"including":[153],"image":[154],"classification,":[155],"detection,":[157],"segmentation":[159],"semantic":[161],"segmentation.":[162]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
