{"id":"https://openalex.org/W7136778164","doi":"https://doi.org/10.48550/arxiv.2603.12708","title":"HFP-SAM: Hierarchical Frequency Prompted SAM for Efficient Marine Animal Segmentation","display_name":"HFP-SAM: Hierarchical Frequency Prompted SAM for Efficient Marine Animal Segmentation","publication_year":2026,"publication_date":"2026-03-13","ids":{"openalex":"https://openalex.org/W7136778164","doi":"https://doi.org/10.48550/arxiv.2603.12708"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.12708","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.12708","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.12708","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129576971","display_name":"Pingping Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Pingping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009706910","display_name":"Tianyu Yan","orcid":"https://orcid.org/0009-0003-1228-8072"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Tianyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129481854","display_name":"Yuhao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yuhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129600228","display_name":"Yang Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129559805","display_name":"Tongdan Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Tongdan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129621162","display_name":"Yili Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Yili","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129430435","display_name":"Long Lv","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lv, Long","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129461936","display_name":"Feng Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Feng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129629839","display_name":"Weibing Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Weibing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129579406","display_name":"and Huchuan Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, and Huchuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8364999890327454,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8364999890327454,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12316","display_name":"Oil Spill Detection and Mitigation","score":0.018200000748038292,"subfield":{"id":"https://openalex.org/subfields/2310","display_name":"Pollution"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.011300000362098217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7360000014305115},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4717000126838684},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4474000036716461},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.40639999508857727},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4050999879837036},{"id":"https://openalex.org/keywords/market-segmentation","display_name":"Market segmentation","score":0.3831000030040741},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3790000081062317},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.325300008058548}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7360000014305115},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7278000116348267},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.604200005531311},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4717000126838684},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4474000036716461},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.40639999508857727},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4050999879837036},{"id":"https://openalex.org/C125308379","wikidata":"https://www.wikidata.org/wiki/Q363057","display_name":"Market segmentation","level":2,"score":0.3831000030040741},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3790000081062317},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33180001378059387},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.325300008058548},{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.3109000027179718},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.3028999865055084},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.2800000011920929},{"id":"https://openalex.org/C97118885","wikidata":"https://www.wikidata.org/wiki/Q565636","display_name":"Frequency analysis","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.12708","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.12708","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.12708","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.12708","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8346360325813293,"id":"https://metadata.un.org/sdg/14","display_name":"Life below water"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Marine":[0],"Animal":[1],"Segmentation":[2],"(MAS)":[3],"aims":[4],"at":[5,172],"identifying":[6],"and":[7,47,121,145],"segmenting":[8],"marine":[9,13,79],"animals":[10],"from":[11],"complex":[12],"environments.":[14],"Most":[15],"of":[16,43,115,163],"previous":[17],"deep":[18],"learning-based":[19],"MAS":[20],"methods":[21],"struggle":[22],"with":[23,111,149],"the":[24,83,112,160],"long-distance":[25],"modeling":[26],"issue.":[27],"Recently,":[28],"Segment":[29],"Anything":[30],"Model":[31],"(SAM)":[32],"has":[33],"gained":[34],"popularity":[35],"in":[36],"general":[37],"image":[38],"segmentation.":[39],"However,":[40],"it":[41],"lacks":[42],"perceiving":[44],"fine-grained":[45],"details":[46],"frequency":[48,88,105],"information.":[49],"To":[50],"this":[51],"end,":[52],"we":[53,69,93,135],"propose":[54],"a":[55,71,95,137],"novel":[56],"learning":[57],"framework,":[58],"named":[59],"Hierarchical":[60],"Frequency":[61,72],"Prompted":[62],"SAM":[63,85,116],"(HFP-SAM)":[64],"for":[65,126],"high-performance":[66],"MAS.":[67],"First,":[68],"design":[70],"Guided":[73],"Adapter":[74],"(FGA)":[75],"to":[76,100,117,130,141],"efficiently":[77,142],"inject":[78],"scene":[80],"information":[81,148],"into":[82,123],"frozen":[84],"backbone":[86],"through":[87,104],"domain":[89],"prior":[90],"masks.":[91],"Additionally,":[92],"introduce":[94,136],"Frequency-aware":[96],"Point":[97],"Selection":[98],"(FPS)":[99],"generate":[101,118],"highlighted":[102],"regions":[103,108],"analysis.":[106],"These":[107],"are":[109],"combined":[110],"coarse":[113],"predictions":[114],"point":[119],"prompts":[120],"integrate":[122],"SAM's":[124],"decoder":[125],"fine":[127],"predictions.":[128],"Finally,":[129],"obtain":[131],"comprehensive":[132],"segmentation":[133],"masks,":[134],"Full-View":[138],"Mamba":[139],"(FVM)":[140],"extract":[143],"spatial":[144],"channel":[146],"contextual":[147],"linear":[150],"computational":[151],"complexity.":[152],"Extensive":[153],"experiments":[154],"on":[155],"four":[156],"public":[157],"datasets":[158],"demonstrate":[159],"superior":[161],"performance":[162],"our":[164],"approach.":[165],"The":[166],"source":[167],"code":[168],"is":[169],"publicly":[170],"available":[171],"https://github.com/Drchip61/TIP-HFP-SAM.":[173]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-17T00:00:00"}
