{"id":"https://openalex.org/W7116962048","doi":"https://doi.org/10.48550/arxiv.2512.17514","title":"Foundation Model Priors Enhance Object Focus in Feature Space for Source-Free Object Detection","display_name":"Foundation Model Priors Enhance Object Focus in Feature Space for Source-Free Object Detection","publication_year":2025,"publication_date":"2025-12-19","ids":{"openalex":"https://openalex.org/W7116962048","doi":"https://doi.org/10.48550/arxiv.2512.17514"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2512.17514","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121063573","display_name":"Sairam VCR","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"VCR, Sairam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038480708","display_name":"Rishabh Lalla","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lalla, Rishabh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076329713","display_name":"Aveen Dayal","orcid":"https://orcid.org/0000-0001-6792-9170"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dayal, Aveen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090991932","display_name":"Tejal Kulkarni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kulkarni, Tejal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121055588","display_name":"Anuj Lalla","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lalla, Anuj","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038020125","display_name":"Vineeth N Balasubramanian","orcid":"https://orcid.org/0000-0003-2656-0375"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Balasubramanian, Vineeth N","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5000709367","display_name":"Muhammad Haris Khan","orcid":"https://orcid.org/0009-0005-1112-0280"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khan, Muhammad Haris","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7416999936103821,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7416999936103821,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.15150000154972076,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.03779999911785126,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6061000227928162},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6032999753952026},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5848000049591064},{"id":"https://openalex.org/keywords/clutter","display_name":"Clutter","score":0.5662000179290771},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5494999885559082},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5307000279426575},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.48010000586509705},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4657000005245209},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.44029998779296875}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6937000155448914},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6748999953269958},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6061000227928162},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6032999753952026},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5848000049591064},{"id":"https://openalex.org/C132094186","wikidata":"https://www.wikidata.org/wiki/Q641585","display_name":"Clutter","level":3,"score":0.5662000179290771},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5494999885559082},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5307000279426575},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5171999931335449},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.48010000586509705},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4657000005245209},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.44029998779296875},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.43220001459121704},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4205000102519989},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.40540000796318054},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3921999931335449},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38019999861717224},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.36239999532699585},{"id":"https://openalex.org/C2776698545","wikidata":"https://www.wikidata.org/wiki/Q2374641","display_name":"Spar","level":2,"score":0.3458999991416931},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.3411000072956085},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C182521987","wikidata":"https://www.wikidata.org/wiki/Q2493877","display_name":"Viola\u2013Jones object detection framework","level":5,"score":0.3215000033378601},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.32100000977516174},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3149999976158142},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.3073999881744385},{"id":"https://openalex.org/C66905080","wikidata":"https://www.wikidata.org/wiki/Q17005494","display_name":"Binary classification","level":3,"score":0.30320000648498535},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.29030001163482666},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.27390000224113464},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.265500009059906},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.26440000534057617}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2512.17514","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2512.17514","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.17514","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2512.17514","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6489356160163879,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Current":[0],"state-of-the-art":[1],"approaches":[2],"in":[3,37],"Source-Free":[4],"Object":[5],"Detection":[6],"(SFOD)":[7],"typically":[8],"rely":[9],"on":[10],"Mean-Teacher":[11],"self-labeling.":[12],"However,":[13],"domain":[14,81],"shift":[15],"often":[16],"reduces":[17],"the":[18,41,53,58,94,103,122],"detector's":[19,104],"ability":[20],"to":[21,56,76,101,153],"maintain":[22],"strong":[23],"object-focused":[24,78],"representations,":[25],"causing":[26],"high-confidence":[27],"activations":[28,119],"over":[29],"background":[30],"clutter.":[31],"This":[32],"weak":[33],"object":[34,125],"focus":[35],"results":[36],"unreliable":[38],"pseudo-labels":[39],"from":[40,112],"detection":[42],"head.":[43],"While":[44],"prior":[45],"works":[46],"mainly":[47],"refine":[48],"these":[49,151],"pseudo-labels,":[50],"they":[51],"overlook":[52],"underlying":[54],"need":[55],"strengthen":[57],"feature":[59,105],"space":[60],"itself.":[61],"We":[62],"propose":[63],"FALCON-SFOD":[64,160],"(Foundation-Aligned":[65],"Learning":[66],"with":[67],"Clutter":[68],"suppression":[69],"and":[70,117,137,156],"Noise":[71,129],"robustness),":[72],"a":[73,146],"framework":[74],"designed":[75],"enhance":[77],"adaptation":[79],"under":[80,140],"shift.":[82],"It":[83],"consists":[84],"of":[85,97],"two":[86],"complementary":[87],"components.":[88],"SPAR":[89,114,133],"(Spatial":[90],"Prior-Aware":[91],"Regularization)":[92],"leverages":[93],"generalization":[95],"strength":[96],"vision":[98],"foundation":[99],"models":[100],"regularize":[102],"space.":[106],"Using":[107],"class-agnostic":[108],"binary":[109],"masks":[110],"derived":[111],"OV-SAM,":[113],"promotes":[115],"structured":[116],"foreground-focused":[118],"by":[120,134,145],"guiding":[121],"network":[123],"toward":[124],"regions.":[126],"IRPL":[127],"(Imbalance-aware":[128],"Robust":[130],"Pseudo-Labeling)":[131],"complements":[132],"promoting":[135],"balanced":[136],"noise-tolerant":[138],"learning":[139],"severe":[141],"foreground-background":[142],"imbalance.":[143],"Guided":[144],"theoretical":[147],"analysis":[148],"that":[149],"connects":[150],"designs":[152],"tighter":[154],"localization":[155],"classification":[157],"error":[158],"bounds,":[159],"achieves":[161],"competitive":[162],"performance":[163],"across":[164],"SFOD":[165],"benchmarks.":[166]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-12-23T00:00:00"}
