{"id":"https://openalex.org/W7131110556","doi":"https://doi.org/10.1109/iccvw69036.2025.00135","title":"PMC-Vid: A Large-Scale Biomedical Video Captioning Dataset","display_name":"PMC-Vid: A Large-Scale Biomedical Video Captioning Dataset","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W7131110556","doi":"https://doi.org/10.1109/iccvw69036.2025.00135"},"language":null,"primary_location":{"id":"doi:10.1109/iccvw69036.2025.00135","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00135","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019191233","display_name":"Yosuke Yamagishi","orcid":"https://orcid.org/0009-0006-7688-3075"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yosuke Yamagishi","raw_affiliation_strings":["The University of Tokyo"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Tokyo","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101463446","display_name":"Kuniaki Saito","orcid":"https://orcid.org/0000-0001-9446-5068"},"institutions":[{"id":"https://openalex.org/I146230289","display_name":"Omron (Japan)","ror":"https://ror.org/00q0w1h45","country_code":"JP","type":"company","lineage":["https://openalex.org/I146230289"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kuniaki Saito","raw_affiliation_strings":["OMRON SINIC X Corporation"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"OMRON SINIC X Corporation","institution_ids":["https://openalex.org/I146230289"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126637302","display_name":"Atsushi Hashimoto","orcid":null},"institutions":[{"id":"https://openalex.org/I146230289","display_name":"Omron (Japan)","ror":"https://ror.org/00q0w1h45","country_code":"JP","type":"company","lineage":["https://openalex.org/I146230289"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Atsushi Hashimoto","raw_affiliation_strings":["OMRON SINIC X Corporation"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"OMRON SINIC X Corporation","institution_ids":["https://openalex.org/I146230289"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126649672","display_name":"Yoshitaka Ushiku","orcid":null},"institutions":[{"id":"https://openalex.org/I146230289","display_name":"Omron (Japan)","ror":"https://ror.org/00q0w1h45","country_code":"JP","type":"company","lineage":["https://openalex.org/I146230289"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yoshitaka Ushiku","raw_affiliation_strings":["OMRON SINIC X Corporation"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"OMRON SINIC X Corporation","institution_ids":["https://openalex.org/I146230289"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.65511556,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1265","last_page":"1275"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7986000180244446,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7986000180244446,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.10679999738931656,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.025299999862909317,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8611000180244446},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.7372000217437744},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.620199978351593},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.5440000295639038},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.47290000319480896},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.46970000863075256}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8611000180244446},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.821399986743927},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.7372000217437744},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.620199978351593},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.5440000295639038},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.47290000319480896},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.46970000863075256},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3871999979019165},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.36719998717308044},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36160001158714294},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.35760000348091125},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34299999475479126},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.335099995136261},{"id":"https://openalex.org/C2983174267","wikidata":"https://www.wikidata.org/wiki/Q3775098","display_name":"Video retrieval","level":2,"score":0.28139999508857727},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.26420000195503235}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccvw69036.2025.00135","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00135","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8738369156","display_name":null,"funder_award_id":"JPMJMS2236","funder_id":"https://openalex.org/F4320338247","funder_display_name":"Moonshot Research and Development Program"}],"funders":[{"id":"https://openalex.org/F4320338247","display_name":"Moonshot Research and Development Program","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1601567445","https://openalex.org/W2065455422","https://openalex.org/W2101105183","https://openalex.org/W2113876684","https://openalex.org/W2142900973","https://openalex.org/W2152984213","https://openalex.org/W2425121537","https://openalex.org/W2801206142","https://openalex.org/W2889418103","https://openalex.org/W2950070192","https://openalex.org/W2950470654","https://openalex.org/W2952132648","https://openalex.org/W2963916161","https://openalex.org/W2964101993","https://openalex.org/W2989322838","https://openalex.org/W3009448441","https://openalex.org/W3013601028","https://openalex.org/W3046408530","https://openalex.org/W3086274320","https://openalex.org/W3106697459","https://openalex.org/W4360600216","https://openalex.org/W4385682555","https://openalex.org/W4386066385","https://openalex.org/W4387211014","https://openalex.org/W4387225661","https://openalex.org/W4389519587","https://openalex.org/W4392172801","https://openalex.org/W4398157498","https://openalex.org/W4398201291","https://openalex.org/W4399567248","https://openalex.org/W4402713111","https://openalex.org/W4402727142","https://openalex.org/W4403650369","https://openalex.org/W4404143589","https://openalex.org/W4405669265","https://openalex.org/W4405673884","https://openalex.org/W4408190450","https://openalex.org/W4413146669","https://openalex.org/W4413259085","https://openalex.org/W4415798317"],"related_works":[],"abstract_inverted_index":{"Video":[0],"understanding":[1],"in":[2,55,65,129],"the":[3,32],"biomedical":[4,34,67,93,130],"domain":[5,27,59,124,147],"presents":[6],"unique":[7],"challenges":[8,128],"due":[9],"to":[10,38,150],"specialized":[11,66,154],"visual":[12],"content":[13,117],"and":[14,58,78,103,146,156],"technical":[15],"terminology,":[16],"yet":[17],"existing":[18,53,111],"multimodal":[19],"models":[20,90,113],"have":[21],"been":[22],"primarily":[23],"evaluated":[24],"on":[25,122,153],"general":[26,123],"benchmarks.":[28],"We":[29],"introduce":[30],"PMC-Vid,":[31],"largest":[33],"video":[35,68,131],"captioning":[36],"dataset":[37,50,73,160],"date,":[39],"containing":[40],"over":[41],"77,000":[42],"video-caption":[43],"pairs":[44],"extracted":[45],"from":[46],"PubMed":[47],"Central.":[48],"This":[49],"significantly":[51],"surpasses":[52],"resources":[54],"both":[56],"scale":[57],"coverage,":[60],"filling":[61],"a":[62,72,82],"critical":[63],"gap":[64],"understanding.":[69,132],"PMC-Vid":[70],"features":[71],"curated":[74],"through":[75],"LLM-assisted":[76],"annotation":[77],"subsequently":[79],"verified":[80],"by":[81],"medical":[83,155],"doctor,":[84],"enabling":[85],"reliable":[86],"evaluation":[87],"of":[88],"video-language":[89,138],"across":[91],"diverse":[92],"domains":[94],"such":[95],"as":[96],"molecular":[97],"biology,":[98,100],"structural":[99],"clinical":[101],"medicine,":[102],"surgical":[104],"procedures.":[105],"Our":[106],"experimental":[107],"validation":[108],"demonstrates":[109],"that":[110],"vision-language":[112],"struggle":[114],"with":[115],"domain-specific":[116],"despite":[118],"their":[119],"strong":[120],"performance":[121,152],"tasks,":[125],"highlighting":[126],"specific":[127],"Through":[133],"baseline":[134],"implementations":[135],"using":[136],"state-of-the-art":[137],"models,":[139],"we":[140],"provide":[141],"insights":[142],"for":[143],"future":[144],"research":[145],"adaptation":[148],"techniques":[149],"improve":[151],"biological":[157],"content.":[158],"The":[159],"is":[161],"available":[162],"at":[163],"https://huggingface.co/datasets/omron-sinicx/PMC-Vid.":[164]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-24T00:00:00"}
