{"id":"https://openalex.org/W7131128955","doi":"https://doi.org/10.1109/robio66223.2025.11377666","title":"Intestinal Robot-Based Abnormality Detection via Pixel-Level Annotation and Vision-Language Model Visualization","display_name":"Intestinal Robot-Based Abnormality Detection via Pixel-Level Annotation and Vision-Language Model Visualization","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7131128955","doi":"https://doi.org/10.1109/robio66223.2025.11377666"},"language":null,"primary_location":{"id":"doi:10.1109/robio66223.2025.11377666","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio66223.2025.11377666","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101726917","display_name":"Yufei Gao","orcid":"https://orcid.org/0000-0002-8737-8449"},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufei Gao","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126647718","display_name":"Yang Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066657129","display_name":"Changshun Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164246","display_name":"First Hospital of Qinhuangdao","ror":"https://ror.org/05pmkqv04","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210164246"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changshun Xie","raw_affiliation_strings":["First Hospital of Qinhuangdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"First Hospital of Qinhuangdao,China","institution_ids":["https://openalex.org/I4210164246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025965660","display_name":"Yuxuan Hou","orcid":"https://orcid.org/0000-0002-0880-6418"},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuxuan Hou","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126615441","display_name":"Junxian Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junxian Feng","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103129337","display_name":"Shuhuan Wen","orcid":"https://orcid.org/0000-0002-7646-4958"},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuhuan Wen","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126627559","display_name":"Huibin Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I39333907","display_name":"Yanshan University","ror":"https://ror.org/02txfnf15","country_code":"CN","type":"education","lineage":["https://openalex.org/I39333907"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huibin Lu","raw_affiliation_strings":["Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center of the Ministry of Education for Intelligent Control System and Intelligent Equipment, Yanshan University,Qinhuangdao,China","institution_ids":["https://openalex.org/I39333907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126652130","display_name":"Qichao Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I6469544","display_name":"City University of Macau","ror":"https://ror.org/04gpd4q15","country_code":"MO","type":"education","lineage":["https://openalex.org/I6469544"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Qichao Zhao","raw_affiliation_strings":["International(Macau)Institute of Academic Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International(Macau)Institute of Academic Research","institution_ids":["https://openalex.org/I6469544"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126599668","display_name":"Hong Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Zhang","raw_affiliation_strings":["Southern University of Science and Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology","institution_ids":["https://openalex.org/I3045169105"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.65628054,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1668","last_page":"1673"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.30720001459121704,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.30720001459121704,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.1347000002861023,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.03830000013113022,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9369000196456909},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.8014000058174133},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6499000191688538},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.4697999954223633},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4499000012874603},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4284000098705292},{"id":"https://openalex.org/keywords/abnormality","display_name":"Abnormality","score":0.42149999737739563}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9369000196456909},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.8014000058174133},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7621999979019165},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6499000191688538},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5501999855041504},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.4697999954223633},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4499000012874603},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4284000098705292},{"id":"https://openalex.org/C50965678","wikidata":"https://www.wikidata.org/wiki/Q2724302","display_name":"Abnormality","level":2,"score":0.42149999737739563},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3716000020503998},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.34360000491142273},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.33390000462532043},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3301999866962433},{"id":"https://openalex.org/C14669888","wikidata":"https://www.wikidata.org/wiki/Q4014850","display_name":"Creative visualization","level":3,"score":0.30410000681877136},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.30219998955726624},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.2946000099182129},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.27070000767707825},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio66223.2025.11377666","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio66223.2025.11377666","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/2","score":0.7034068703651428,"display_name":"Zero hunger"}],"awards":[{"id":"https://openalex.org/G5191620234","display_name":null,"funder_award_id":"62273296","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2110764733","https://openalex.org/W2194775991","https://openalex.org/W2295107390","https://openalex.org/W2885318284","https://openalex.org/W3082624664","https://openalex.org/W3169077988","https://openalex.org/W4312289809","https://openalex.org/W4312772600","https://openalex.org/W4320497376","https://openalex.org/W4365814785","https://openalex.org/W4386065385","https://openalex.org/W4399179612","https://openalex.org/W4402703054","https://openalex.org/W4402917235","https://openalex.org/W4403257427","https://openalex.org/W4408609950"],"related_works":[],"abstract_inverted_index":{"The":[0],"growing":[1],"demand":[2],"for":[3,22,45,54,115,171],"early":[4],"detection":[5],"of":[6,31,68,140,163],"colorectal":[7],"diseases":[8],"has":[9,41],"led":[10],"to":[11,65,104,159],"increasing":[12],"interest":[13],"in":[14,61,166],"applying":[15],"vision-language":[16,164],"models":[17,165],"(VLMs),":[18],"such":[19,62],"as":[20],"CLIP,":[21],"automated":[23],"intestinal":[24,39,92,168],"abnormality":[25],"detection.":[26],"In":[27,76],"particular,":[28],"the":[29,66,121,138,161],"development":[30],"robotic":[32],"endoscopy":[33],"systems":[34,170],"including":[35],"capsule":[36],"and":[37,50,72,98,118,143,151],"soft":[38],"robots":[40],"created":[42],"new":[43],"opportunities":[44],"AI-assisted":[46],"diagnosis,":[47],"where":[48],"interpretability":[49,106],"reliability":[51],"are":[52],"critical":[53],"real-world":[55],"deployment.":[56],"However,":[57],"VLMs":[58],"remain":[59],"limited":[60],"scenarios":[63],"due":[64],"lack":[67],"fine-grained":[69],"annotated":[70,87],"datasets":[71],"transparent":[73],"decision-making":[74],"mechanisms.":[75],"this":[77],"work,":[78],"we":[79],"address":[80],"these":[81],"challenges":[82],"by":[83],"constructing":[84],"a":[85,100],"pixel-level":[86],"dataset":[88,111],"focused":[89],"on":[90,129],"common":[91],"abnormalities":[93],"(e.g.,":[94],"polyps,":[95],"bleeding,":[96],"inflammation),":[97],"designing":[99],"CLIP-guided":[101],"visualization":[102,122,144],"pipeline":[103],"enhance":[105],"during":[107],"model":[108,116],"inference.":[109],"Our":[110],"provides":[112,156],"high-quality":[113],"supervision":[114],"training":[117],"evaluation,":[119],"while":[120],"module":[123,145],"highlights":[124],"spatial":[125],"anomaly":[126],"regions":[127],"based":[128],"visual-textual":[130],"similarity.":[131],"Experiments":[132],"under":[133],"few-shot":[134],"settings":[135],"demonstrate":[136],"that":[137],"combination":[139],"our":[141],"annotations":[142],"significantly":[146],"improves":[147],"both":[148],"classification":[149],"performance":[150],"clinical":[152],"transparency.":[153],"This":[154],"work":[155],"foundational":[157],"tools":[158],"support":[160],"deployment":[162],"intelligent":[167],"robot":[169],"medical":[172],"diagnosis.":[173]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-24T00:00:00"}
