{"id":"https://openalex.org/W4403791333","doi":"https://doi.org/10.1145/3664647.3681529","title":"ReForm-Eval: Evaluating Large Vision Language Models via Unified Re-Formulation of Task-Oriented Benchmarks","display_name":"ReForm-Eval: Evaluating Large Vision Language Models via Unified Re-Formulation of Task-Oriented Benchmarks","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403791333","doi":"https://doi.org/10.1145/3664647.3681529"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3681529","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681529","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019514950","display_name":"Zejun Li","orcid":"https://orcid.org/0000-0002-7443-8027"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zejun Li","raw_affiliation_strings":["School of Data Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-7443-8027","affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ye Wang","orcid":"https://orcid.org/0009-0005-0062-3181"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ye Wang","raw_affiliation_strings":["Academy for Engineering and Technology, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0005-0062-3181","affiliations":[{"raw_affiliation_string":"Academy for Engineering and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019333214","display_name":"Mengfei Du","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengfei Du","raw_affiliation_strings":["School of Data Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0009-3078-417X","affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qingwen Liu","orcid":"https://orcid.org/0009-0002-3161-5158"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]},{"id":"https://openalex.org/I4210085920","display_name":"Shanghai Institute for Science of Science","ror":"https://ror.org/004srxn73","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210085920"]},{"id":"https://openalex.org/I4210164150","display_name":"Shanghai Center for Brain Science and Brain-Inspired Technology","ror":"https://ror.org/0551a0y31","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210164150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingwen Liu","raw_affiliation_strings":["Institute of Science and Technology for Brain-Inspired Intelligence, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0002-3161-5158","affiliations":[{"raw_affiliation_string":"Institute of Science and Technology for Brain-Inspired Intelligence, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I4210164150","https://openalex.org/I4210085920","https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113017223","display_name":"Binhao Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Binhao Wu","raw_affiliation_strings":["School of Data Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0007-4377-7679","affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024632865","display_name":"Jiwen Zhang","orcid":"https://orcid.org/0000-0002-8060-6824"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiwen Zhang","raw_affiliation_strings":["School of Data Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-8060-6824","affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005173239","display_name":"Chengxing Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengxing Zhou","raw_affiliation_strings":["Software College, Northeastern University, Shenyang, Liaoning, China"],"raw_orcid":"https://orcid.org/0009-0006-8809-2422","affiliations":[{"raw_affiliation_string":"Software College, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078689432","display_name":"Zhihao Fan","orcid":"https://orcid.org/0000-0002-9910-7937"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhihao Fan","raw_affiliation_strings":["Alibaba Group, Hangzhou, Zhejiang, China"],"raw_orcid":"https://orcid.org/0000-0002-9910-7937","affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101713885","display_name":"Jie Fu","orcid":"https://orcid.org/0000-0002-4494-843X"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jie Fu","raw_affiliation_strings":["Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China"],"raw_orcid":"https://orcid.org/0000-0002-4494-843X","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100373491","display_name":"Jingjing Chen","orcid":"https://orcid.org/0000-0003-1737-3420"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing Chen","raw_affiliation_strings":["School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-1737-3420","affiliations":[{"raw_affiliation_string":"School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011504177","display_name":"Zhongyu Wei","orcid":"https://orcid.org/0000-0003-3789-8507"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhongyu Wei","raw_affiliation_strings":["School of Data Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-3789-8507","affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088834359","display_name":"Xuanjing Huang","orcid":"https://orcid.org/0000-0001-9197-9426"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuanjing Huang","raw_affiliation_strings":["School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-9197-9426","affiliations":[{"raw_affiliation_string":"School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5019514950"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.2381,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.53597412,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1971","last_page":"1980"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7721630930900574},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.658083438873291},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4523348808288574},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4515690505504608},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4388885498046875},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.41319432854652405},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.11024200916290283},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09920558333396912}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7721630930900574},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.658083438873291},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4523348808288574},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4515690505504608},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4388885498046875},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.41319432854652405},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.11024200916290283},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09920558333396912}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3664647.3681529","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681529","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-148926","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-148926","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1971822075","https://openalex.org/W2049951199","https://openalex.org/W2185175083","https://openalex.org/W2187089797","https://openalex.org/W2277195237","https://openalex.org/W2489434015","https://openalex.org/W2533598788","https://openalex.org/W2560730294","https://openalex.org/W2597425697","https://openalex.org/W2886641317","https://openalex.org/W2963115613","https://openalex.org/W2963622213","https://openalex.org/W3177174258","https://openalex.org/W3198897329","https://openalex.org/W4225323055","https://openalex.org/W4287113019","https://openalex.org/W4287824540","https://openalex.org/W4296605665","https://openalex.org/W4313045695","https://openalex.org/W4381802186","https://openalex.org/W4383860112","https://openalex.org/W4385990846","https://openalex.org/W4403081466"],"related_works":["https://openalex.org/W2169518243","https://openalex.org/W4231937131","https://openalex.org/W3188962172","https://openalex.org/W4389443772","https://openalex.org/W323219885","https://openalex.org/W2063928587","https://openalex.org/W2772917594","https://openalex.org/W1487966966","https://openalex.org/W3204019825","https://openalex.org/W3098003361"],"abstract_inverted_index":{"Recent":[0],"years":[1],"have":[2,43],"witnessed":[3],"remarkable":[4],"progress":[5],"in":[6,120,130],"the":[7,16,39,64,73,78,124],"development":[8],"of":[9,41,68,113,128],"large":[10],"vision-language":[11],"models":[12],"(LVLMs).":[13],"Benefiting":[14],"from":[15],"strong":[17],"language":[18],"backbones":[19],"and":[20,33,47,76,100,118,126,136],"efficient":[21],"cross-modal":[22],"alignment":[23],"strategies,":[24],"LVLMs":[25,42],"exhibit":[26],"surprising":[27],"capabilities":[28,40,112],"to":[29,61,88],"perceive":[30],"visual":[31],"signals":[32],"perform":[34],"visually":[35],"grounded":[36],"reasoning.":[37],"However,":[38],"not":[44],"been":[45],"comprehensively":[46],"quantitatively":[48],"evaluated.":[49],"Most":[50],"existing":[51,90],"multi-modal":[52],"benchmarks":[53,91],"require":[54],"task-oriented":[55],"input-output":[56],"formats,":[57],"posing":[58],"great":[59],"challenges":[60],"automatically":[62],"assess":[63],"free-form":[65],"text":[66],"output":[67],"LVLMs.":[69,114,133],"To":[70],"effectively":[71],"leverage":[72],"annotations":[74],"available":[75,141],"reduce":[77],"manual":[79],"efforts":[80],"required":[81],"for":[82,109],"constructing":[83],"new":[84],"benchmarks,":[85],"we":[86,102,122],"propose":[87],"re-formulate":[89],"into":[92],"unified":[93],"LVLM-compatible":[94],"formats.":[95],"Through":[96,115],"systematic":[97],"data":[98,108],"collection":[99],"reformulation,":[101],"present":[103],"ReForm-Eval":[104,129],"benchmark,":[105],"offering":[106],"substantial":[107],"evaluating":[110],"various":[111,132],"extensive":[116],"experiments":[117],"analysis":[119],"ReForm-Eval,":[121],"demonstrate":[123],"comprehensiveness":[125],"reliability":[127],"assessing":[131],"Our":[134],"benchmark":[135],"evaluation":[137],"framework":[138],"is":[139],"now":[140],"at":[142],"https://github.com/FudanDISC/ReForm-Eval":[143]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
