{"id":"https://openalex.org/W7135181947","doi":"https://doi.org/10.1109/iccp68926.2025.11427110","title":"Enhancing Mask R-CNN to Improve Camouflaged Object Detection","display_name":"Enhancing Mask R-CNN to Improve Camouflaged Object Detection","publication_year":2025,"publication_date":"2025-10-16","ids":{"openalex":"https://openalex.org/W7135181947","doi":"https://doi.org/10.1109/iccp68926.2025.11427110"},"language":null,"primary_location":{"id":"doi:10.1109/iccp68926.2025.11427110","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccp68926.2025.11427110","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 21st International Conference on Intelligent Computer Communication and Processing (ICCP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128965330","display_name":"Maria Zuba\u015fcu","orcid":null},"institutions":[{"id":"https://openalex.org/I158333966","display_name":"Technical University of Cluj-Napoca","ror":"https://ror.org/03r8nwp71","country_code":"RO","type":"education","lineage":["https://openalex.org/I158333966"]}],"countries":["RO"],"is_corresponding":true,"raw_author_name":"Maria Zuba\u015fcu","raw_affiliation_strings":["Technical University of Cluj-Napoca,Computer Science Department,Cluj-Napoca,Romania"],"affiliations":[{"raw_affiliation_string":"Technical University of Cluj-Napoca,Computer Science Department,Cluj-Napoca,Romania","institution_ids":["https://openalex.org/I158333966"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042712140","display_name":"Cristian Vancea","orcid":"https://orcid.org/0000-0003-0270-1962"},"institutions":[{"id":"https://openalex.org/I158333966","display_name":"Technical University of Cluj-Napoca","ror":"https://ror.org/03r8nwp71","country_code":"RO","type":"education","lineage":["https://openalex.org/I158333966"]}],"countries":["RO"],"is_corresponding":false,"raw_author_name":"Cristian-Cosmin Vancea","raw_affiliation_strings":["Technical University of Cluj-Napoca,Computer Science Department,Cluj-Napoca,Romania"],"affiliations":[{"raw_affiliation_string":"Technical University of Cluj-Napoca,Computer Science Department,Cluj-Napoca,Romania","institution_ids":["https://openalex.org/I158333966"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5128965330"],"corresponding_institution_ids":["https://openalex.org/I158333966"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.76730265,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.5311999917030334,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.5311999917030334,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.11159999668598175,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.049800001084804535,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.49549999833106995},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4009000062942505},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.3305000066757202},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.30059999227523804},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.296999990940094},{"id":"https://openalex.org/keywords/edge-detection","display_name":"Edge detection","score":0.2922999858856201}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6144999861717224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6003000140190125},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5543000102043152},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.49549999833106995},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4009000062942505},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3305000066757202},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.30059999227523804},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C193536780","wikidata":"https://www.wikidata.org/wiki/Q1513153","display_name":"Edge detection","level":4,"score":0.2922999858856201},{"id":"https://openalex.org/C2776196576","wikidata":"https://www.wikidata.org/wiki/Q196113","display_name":"Camouflage","level":2,"score":0.28279998898506165},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2667999863624573},{"id":"https://openalex.org/C4641261","wikidata":"https://www.wikidata.org/wiki/Q11681085","display_name":"Face detection","level":4,"score":0.25619998574256897},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.25040000677108765},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccp68926.2025.11427110","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccp68926.2025.11427110","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 21st International Conference on Intelligent Computer Communication and Processing (ICCP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1861492603","https://openalex.org/W2047597695","https://openalex.org/W2133393886","https://openalex.org/W2194775991","https://openalex.org/W2549139847","https://openalex.org/W2565639579","https://openalex.org/W2808725022","https://openalex.org/W2884436604","https://openalex.org/W2906700625","https://openalex.org/W2928165649","https://openalex.org/W2963037989","https://openalex.org/W2963150697","https://openalex.org/W2963868681","https://openalex.org/W2972006294","https://openalex.org/W3034684132","https://openalex.org/W3039368862","https://openalex.org/W3091762720","https://openalex.org/W3163825518","https://openalex.org/W3177165656","https://openalex.org/W3203700770","https://openalex.org/W4312258849","https://openalex.org/W4313023779","https://openalex.org/W4401328675","https://openalex.org/W4403420280","https://openalex.org/W4405490583","https://openalex.org/W4411871400"],"related_works":[],"abstract_inverted_index":{"Camouflaged":[0],"Object":[1],"Detection":[2],"(COD)":[3],"involves":[4],"identifying":[5],"and":[6,124,188],"segmenting":[7],"objects":[8],"that":[9,57,163],"become":[10],"part":[11],"of":[12,177],"the":[13,42,99,115,153,159,175],"background.":[14],"It":[15],"is":[16],"a":[17,63,105,147,165],"complicated":[18],"task":[19],"for":[20,49],"Computer":[21],"Vision,":[22],"which":[23,110],"requires":[24],"techniques":[25],"able":[26],"to":[27,74,145,152],"exploit":[28],"visual":[29],"features":[30],"beyond":[31],"human":[32],"eye":[33],"capabilities.":[34],"Traditional":[35],"methods":[36],"using":[37,67,114,135,164],"pixel-wise":[38],"local":[39],"analysis":[40],"in":[41,78],"RGB":[43],"color":[44],"space":[45],"are":[46],"usually":[47],"insufficient":[48],"this":[50],"task.":[51,155],"After":[52],"comprehensive":[53],"testing,":[54],"we":[55],"noticed":[56],"Mask":[58,89,179],"R-CNN":[59,90,180],"models,":[60],"provided":[61],"with":[62,91,169,181],"supporting":[64],"attention":[65,112],"map":[66],"Discrete":[68],"Cosine":[69],"Transform":[70],"(DCT)":[71],"information,":[72],"proved":[73],"be":[75],"more":[76],"accurate":[77],"detecting":[79],"camouflaged":[80],"objects.":[81],"We":[82,120,140],"developed":[83],"five":[84],"original":[85],"models":[86,100,127,132],"based":[87,107],"on":[88,108,128,158,184,190],"different":[92],"backbones,":[93],"including":[94],"ResNet-50,":[95],"Res2Net,":[96],"ResNeXt.":[97],"Additionally,":[98],"were":[101,133],"enhanced":[102],"by":[103],"inserting":[104],"module":[106,173],"DCT,":[109],"generates":[111],"maps":[113],"Self-Attention":[116,172],"mechanism":[117],"from":[118],"Transformers.":[119],"used":[121],"pre-trained":[122],"backbones":[123],"trained":[125],"our":[126,170],"COD10K":[129,160],"dataset.":[130],"The":[131],"evaluated":[134],"standard":[136,178],"COCO":[137],"IoU-based":[138],"metrics.":[139],"also":[141],"adopted":[142],"Structure":[143,191],"Measure":[144],"assess":[146],"superior":[148],"qualitative":[149],"examination":[150],"specific":[151],"segmentation":[154],"Experiments":[156],"conducted":[157],"dataset":[161],"demonstrate":[162],"ResNet-50":[166],"backbone":[167],"combined":[168],"DCT":[171],"improves":[174],"performance":[176],"approximately":[182],"0.08":[183],"$\\mathrm{AP}":[185],"\\text{@}":[186],"0.5$":[187],"0.03":[189],"Measure.":[192]},"counts_by_year":[],"updated_date":"2026-03-15T07:15:06.534987","created_date":"2026-03-14T00:00:00"}
