{"id":"https://openalex.org/W4415539296","doi":"https://doi.org/10.1145/3746027.3758221","title":"PhysLab: A Benchmark Dataset for Multi-Granularity Visual Parsing of Physics Experiments","display_name":"PhysLab: A Benchmark Dataset for Multi-Granularity Visual Parsing of Physics Experiments","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415539296","doi":"https://doi.org/10.1145/3746027.3758221"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3758221","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3758221","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022701174","display_name":"Minghao Zou","orcid":"https://orcid.org/0000-0002-0239-3990"},"institutions":[{"id":"https://openalex.org/I79510175","display_name":"Cardiff University","ror":"https://ror.org/03kk7td41","country_code":"GB","type":"education","lineage":["https://openalex.org/I79510175"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Minghao Zou","raw_affiliation_strings":["Shandong University of Science and Technology, Qingdao, China and Cardiff University, Cardiff, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0002-0239-3990","affiliations":[{"raw_affiliation_string":"Shandong University of Science and Technology, Qingdao, China and Cardiff University, Cardiff, United Kingdom","institution_ids":["https://openalex.org/I79510175"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003178957","display_name":"Qingtian Zeng","orcid":"https://orcid.org/0000-0002-6421-8223"},"institutions":[{"id":"https://openalex.org/I80143920","display_name":"Shandong University of Science and Technology","ror":"https://ror.org/04gtjhw98","country_code":"CN","type":"education","lineage":["https://openalex.org/I80143920"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingtian Zeng","raw_affiliation_strings":["Shandong University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-6421-8223","affiliations":[{"raw_affiliation_string":"Shandong University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I80143920"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010947777","display_name":"Yongping Miao","orcid":null},"institutions":[{"id":"https://openalex.org/I80143920","display_name":"Shandong University of Science and Technology","ror":"https://ror.org/04gtjhw98","country_code":"CN","type":"education","lineage":["https://openalex.org/I80143920"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongping Miao","raw_affiliation_strings":["Shandong University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0009-0002-7210-1938","affiliations":[{"raw_affiliation_string":"Shandong University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I80143920"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022821709","display_name":"Shangkun Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I80143920","display_name":"Shandong University of Science and Technology","ror":"https://ror.org/04gtjhw98","country_code":"CN","type":"education","lineage":["https://openalex.org/I80143920"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shangkun Liu","raw_affiliation_strings":["Shandong University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0001-5728-5092","affiliations":[{"raw_affiliation_string":"Shandong University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I80143920"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zilong Wang","orcid":"https://orcid.org/0009-0006-1876-0851"},"institutions":[{"id":"https://openalex.org/I80143920","display_name":"Shandong University of Science and Technology","ror":"https://ror.org/04gtjhw98","country_code":"CN","type":"education","lineage":["https://openalex.org/I80143920"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zilong Wang","raw_affiliation_strings":["Shandong University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0009-0006-1876-0851","affiliations":[{"raw_affiliation_string":"Shandong University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I80143920"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101605853","display_name":"Hantao Liu","orcid":"https://orcid.org/0000-0003-4544-3481"},"institutions":[{"id":"https://openalex.org/I79510175","display_name":"Cardiff University","ror":"https://ror.org/03kk7td41","country_code":"GB","type":"education","lineage":["https://openalex.org/I79510175"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Hantao Liu","raw_affiliation_strings":["Cardiff University, Cardiff, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0003-4544-3481","affiliations":[{"raw_affiliation_string":"Cardiff University, Cardiff, United Kingdom","institution_ids":["https://openalex.org/I79510175"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077250575","display_name":"Wei Zhou","orcid":"https://orcid.org/0000-0003-3641-1429"},"institutions":[{"id":"https://openalex.org/I79510175","display_name":"Cardiff University","ror":"https://ror.org/03kk7td41","country_code":"GB","type":"education","lineage":["https://openalex.org/I79510175"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Wei Zhou","raw_affiliation_strings":["Cardiff University, Cardiff, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0003-3641-1429","affiliations":[{"raw_affiliation_string":"Cardiff University, Cardiff, United Kingdom","institution_ids":["https://openalex.org/I79510175"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27380056,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"12799","last_page":"12806"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9886000156402588,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7660999894142151},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.628600001335144},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6019999980926514},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.586899995803833},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5756000280380249},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5568000078201294},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5472000241279602},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4950999915599823}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7702000141143799},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7660999894142151},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.628600001335144},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6019999980926514},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.586899995803833},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5756000280380249},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5568000078201294},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5472000241279602},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.531499981880188},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4950999915599823},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4885999858379364},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.46560001373291016},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.42660000920295715},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42309999465942383},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4212000072002411},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.39500001072883606},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.3903999924659729},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3862999975681305},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.35179999470710754},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3492000102996826},{"id":"https://openalex.org/C161301231","wikidata":"https://www.wikidata.org/wiki/Q3478658","display_name":"Knowledge representation and reasoning","level":2,"score":0.3391000032424927},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.33070001006126404},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3118000030517578},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.28610000014305115},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2791999876499176},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.273499995470047},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2619999945163727}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3746027.3758221","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3758221","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:https://orca.cardiff.ac.uk:182178","is_oa":false,"landing_page_url":"https://orca.cardiff.ac.uk/view/cardiffauthors/A2188076Q.html>","pdf_url":null,"source":{"id":"https://openalex.org/S4306401195","display_name":"ORCA Online Research @Cardiff (Cardiff University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79510175","host_organization_name":"Cardiff University","host_organization_lineage":["https://openalex.org/I79510175"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"Conference or Workshop Item"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4353863251","display_name":null,"funder_award_id":"52374221","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4669388470","display_name":null,"funder_award_id":"2022ZD0119501","funder_id":"https://openalex.org/F4320335960","funder_display_name":"National Major Science and Technology Projects of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335960","display_name":"National Major Science and Technology Projects of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2277195237","https://openalex.org/W2295288655","https://openalex.org/W2336403884","https://openalex.org/W3087464567","https://openalex.org/W3096563782","https://openalex.org/W4285004868","https://openalex.org/W4288083516","https://openalex.org/W4307838488","https://openalex.org/W4311121622","https://openalex.org/W4318475704","https://openalex.org/W4364375804","https://openalex.org/W4387917672","https://openalex.org/W4387969557","https://openalex.org/W4388430502","https://openalex.org/W4388579521","https://openalex.org/W4391216244","https://openalex.org/W4391248741","https://openalex.org/W4393081565","https://openalex.org/W4400075398","https://openalex.org/W4403791539","https://openalex.org/W4403791556"],"related_works":[],"abstract_inverted_index":{"Visual":[0],"parsing":[1,148],"of":[2,12,24,46,51,61,72,124,149],"images":[3],"and":[4,57,69,105,116,138,171,179,184],"videos":[5,115],"is":[6,20],"critical":[7],"for":[8,35,54,162],"a":[9,40,49,59,73,122,159],"wide":[10],"range":[11],"real-world":[13],"applications.":[14],"However,":[15],"progress":[16],"in":[17,146],"this":[18],"field":[19],"constrained":[21],"by":[22],"limitations":[23],"existing":[25],"datasets:":[26],"(1)":[27],"limited":[28],"annotation":[29],"diversity,":[30],"which":[31],"limits":[32],"the":[33,84,147,185],"support":[34,121],"diverse":[36,102],"vision":[37,125],"tasks":[38],"within":[39],"unified":[41],"dataset;":[42],"(2)":[43],"insufficient":[44,70],"coverage":[45],"domains,":[47],"particularly":[48],"lack":[50,60],"datasets":[52],"tailored":[53],"educational":[55,151,180],"scenarios;":[56],"(3)":[58],"explicit":[62],"procedural":[63,150],"guidance,":[64],"with":[65],"weak":[66],"logical":[67],"rules":[68],"representation":[71],"structured":[74],"task":[75],"process.":[76],"To":[77],"address":[78],"these":[79],"gaps,":[80],"we":[81],"introduce":[82],"PhysLab,":[83],"first":[85],"dataset":[86,95,183],"that":[87,100,120],"captures":[88],"students":[89],"conducting":[90],"complex":[91],"physics":[92],"experiments.":[93],"The":[94,182],"includes":[96],"four":[97],"representative":[98],"experiments":[99],"feature":[101],"scientific":[103],"instruments":[104],"rich":[106],"human-object":[107],"interaction":[108],"(HOI)":[109],"patterns.":[110],"PhysLab":[111,155],"comprises":[112],"620":[113],"long-form":[114],"provides":[117],"multi-granularity":[118],"annotations":[119],"variety":[123],"tasks,":[126],"including":[127],"action":[128],"recognition,":[129],"object":[130],"detection,":[131],"HOI":[132],"analysis,":[133],"etc.":[134],"We":[135,153],"establish":[136],"baselines":[137],"perform":[139],"extensive":[140],"evaluations":[141],"to":[142,156],"highlight":[143],"key":[144],"challenges":[145],"videos.":[152],"expect":[154],"serve":[157],"as":[158],"valuable":[160],"resource":[161],"advancing":[163],"comprehensive":[164],"visual":[165],"parsing,":[166],"facilitating":[167],"intelligent":[168],"classroom":[169],"systems,":[170],"fostering":[172],"closer":[173],"integration":[174],"among":[175],"computer":[176],"vision,":[177],"multimedia,":[178],"technologies.":[181],"evaluation":[186],"toolkit":[187],"are":[188],"publicly":[189],"available":[190],"at":[191],"https://github.com/ZMH-SDUST/PhysLab.":[192]},"counts_by_year":[],"updated_date":"2026-07-02T09:51:11.867554","created_date":"2025-10-25T00:00:00"}
