{"id":"https://openalex.org/W4402952971","doi":"https://doi.org/10.48550/arxiv.2409.00045","title":"PolypDB: A Curated Multi-Center Dataset for Development of AI Algorithms in Colonoscopy","display_name":"PolypDB: A Curated Multi-Center Dataset for Development of AI Algorithms in Colonoscopy","publication_year":2024,"publication_date":"2024-08-19","ids":{"openalex":"https://openalex.org/W4402952971","doi":"https://doi.org/10.48550/arxiv.2409.00045"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2409.00045","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.00045","pdf_url":"https://arxiv.org/pdf/2409.00045","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2409.00045","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044673103","display_name":"Debesh Jha","orcid":"https://orcid.org/0000-0002-8078-6730"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jha, Debesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076182848","display_name":"Nikhil Kumar Tomar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tomar, Nikhil Kumar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043592090","display_name":"Vanshali Sharma","orcid":"https://orcid.org/0000-0003-0008-1579"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Vanshali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025256654","display_name":"Quoc-Huy Trinh","orcid":"https://orcid.org/0000-0002-7205-3211"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Trinh, Quoc-Huy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010852509","display_name":"Koushik Biswas","orcid":"https://orcid.org/0000-0002-9818-8966"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Biswas, Koushik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007142636","display_name":"Hongyi Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Hongyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101837028","display_name":"Ritika K. Jha","orcid":"https://orcid.org/0009-0001-6489-909X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jha, Ritika K.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033826718","display_name":"G\u00f6rkem Durak","orcid":"https://orcid.org/0000-0002-1608-1955"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Durak, Gorkem","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051168420","display_name":"Alexander Hann","orcid":"https://orcid.org/0000-0001-8035-3559"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hann, Alexander","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042297343","display_name":"Jonas Varkey","orcid":"https://orcid.org/0000-0002-3499-7051"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Varkey, Jonas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081957303","display_name":"Hang Viet Dao","orcid":"https://orcid.org/0000-0002-3685-9496"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dao, Hang Viet","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077829431","display_name":"Long Van Dao","orcid":"https://orcid.org/0000-0002-7162-9557"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Van Dao, Long","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070089702","display_name":"Binh Phuc Nguyen","orcid":"https://orcid.org/0000-0002-3572-9235"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Binh Phuc","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029325201","display_name":"Nikolaos Papachrysos","orcid":"https://orcid.org/0000-0002-2372-2554"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Papachrysos, Nikolaos","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066246680","display_name":"Brandon Rieders","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rieders, Brandon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004429568","display_name":"Peter T. Schmidt","orcid":"https://orcid.org/0000-0001-8338-5468"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schmidt, Peter Thelin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113407763","display_name":"Enrik Geissler","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Geissler, Enrik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088236048","display_name":"Tyler M. Berzin","orcid":"https://orcid.org/0000-0002-4364-6210"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Berzin, Tyler","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088962741","display_name":"P\u00e5l Halvorsen","orcid":"https://orcid.org/0000-0003-2073-7029"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Halvorsen, P\u00e5l","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102968267","display_name":"Michael A. Riegler","orcid":"https://orcid.org/0000-0002-3153-2064"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Riegler, Michael A.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081724732","display_name":"Thomas de Lange","orcid":"https://orcid.org/0000-0003-3989-7487"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Lange, Thomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5030188696","display_name":"Ula\u015f Ba\u011fc\u0131","orcid":"https://orcid.org/0000-0001-7379-6829"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bagci, Ulas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":22,"corresponding_author_ids":["https://openalex.org/A5044673103"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10552","display_name":"Colorectal Cancer Screening and Detection","score":0.9814000129699707,"subfield":{"id":"https://openalex.org/subfields/2730","display_name":"Oncology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10552","display_name":"Colorectal Cancer Screening and Detection","score":0.9814000129699707,"subfield":{"id":"https://openalex.org/subfields/2730","display_name":"Oncology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12422","display_name":"Radiomics and Machine Learning in Medical Imaging","score":0.9782000184059143,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.593524158000946},{"id":"https://openalex.org/keywords/center","display_name":"Center (category theory)","score":0.559953510761261},{"id":"https://openalex.org/keywords/colonoscopy","display_name":"Colonoscopy","score":0.5224674940109253},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42908263206481934},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33335864543914795},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.1492367684841156},{"id":"https://openalex.org/keywords/internal-medicine","display_name":"Internal medicine","score":0.06545200943946838},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.051127612590789795},{"id":"https://openalex.org/keywords/crystallography","display_name":"Crystallography","score":0.0419880747795105}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.593524158000946},{"id":"https://openalex.org/C2779463800","wikidata":"https://www.wikidata.org/wiki/Q5062222","display_name":"Center (category theory)","level":2,"score":0.559953510761261},{"id":"https://openalex.org/C2778435480","wikidata":"https://www.wikidata.org/wiki/Q840387","display_name":"Colonoscopy","level":4,"score":0.5224674940109253},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42908263206481934},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33335864543914795},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.1492367684841156},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.06545200943946838},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.051127612590789795},{"id":"https://openalex.org/C8010536","wikidata":"https://www.wikidata.org/wiki/Q160398","display_name":"Crystallography","level":1,"score":0.0419880747795105},{"id":"https://openalex.org/C526805850","wikidata":"https://www.wikidata.org/wiki/Q188874","display_name":"Colorectal cancer","level":3,"score":0.0},{"id":"https://openalex.org/C121608353","wikidata":"https://www.wikidata.org/wiki/Q12078","display_name":"Cancer","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2409.00045","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.00045","pdf_url":"https://arxiv.org/pdf/2409.00045","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2409.00045","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2409.00045","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2409.00045","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.00045","pdf_url":"https://arxiv.org/pdf/2409.00045","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2381279477","https://openalex.org/W3016587774","https://openalex.org/W2999920852","https://openalex.org/W3028983594","https://openalex.org/W2363227174","https://openalex.org/W3211062742","https://openalex.org/W4318274204","https://openalex.org/W2073857279"],"abstract_inverted_index":{"Colonoscopy":[0],"is":[1,157],"the":[2,18,25,29,46,50,168],"primary":[3],"method":[4],"for":[5,67,71],"examination,":[6],"detection,":[7,171],"and":[8,24,64,74,91,123,135,144,153,159,175],"removal":[9],"of":[10,28,48,57,59],"polyps.":[11],"However,":[12],"challenges":[13],"such":[14],"as":[15],"variations":[16],"among":[17],"endoscopists'":[19],"skills,":[20],"bowel":[21],"quality":[22],"preparation,":[23],"complex":[26],"nature":[27],"large":[30,63,80],"intestine":[31],"contribute":[32],"to":[33],"high":[34],"polyp":[35,72,89],"miss-rate.":[36],"These":[37],"missed":[38],"polyps":[39],"can":[40,160,178],"develop":[41],"into":[42],"cancer":[43],"later,":[44],"underscoring":[45],"importance":[47],"improving":[49],"detection":[51,73,154],"methods.":[52],"To":[53],"address":[54],"this":[55],"gap":[56],"lack":[58],"publicly":[60,82],"available,":[61],"multi-center":[62],"diverse":[65],"datasets":[66],"developing":[68],"automatic":[69],"methods":[70],"segmentation,":[75,170],"we":[76],"introduce":[77],"PolypDB,":[78],"a":[79,139],"scale":[81],"available":[83],"dataset":[84],"that":[85],"contains":[86],"3934":[87],"still":[88],"images":[90,102],"their":[92],"corresponding":[93],"ground":[94],"truth":[95],"from":[96,103,128],"real":[97],"colonoscopy":[98],"videos.":[99],"PolypDB":[100,156],"comprises":[101],"five":[104],"modalities:":[105],"Blue":[106],"Light":[107,125],"Imaging":[108,111,117,121,126],"(BLI),":[109],"Flexible":[110],"Color":[112,116],"Enhancement":[113],"(FICE),":[114],"Linked":[115],"(LCI),":[118],"Narrow":[119],"Band":[120],"(NBI),":[122],"White":[124],"(WLI)":[127],"three":[129],"medical":[130],"centers":[131],"in":[132],"Norway,":[133],"Sweden,":[134],"Vietnam.":[136],"We":[137],"provide":[138],"benchmark":[140,174],"on":[141],"each":[142],"modality":[143],"center,":[145],"including":[146],"federated":[147,172],"learning":[148,173],"settings":[149],"using":[150],"popular":[151],"segmentation":[152],"benchmarks.":[155],"public":[158],"be":[161,179],"downloaded":[162],"at":[163,181],"\\url{https://osf.io/pr7ms/}.":[164],"More":[165],"information":[166],"about":[167],"dataset,":[169],"train-test":[176],"split":[177],"found":[180],"\\url{https://github.com/DebeshJha/PolypDB}.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-05-10T08:33:47.465468","created_date":"2025-10-10T00:00:00"}
