{"id":"https://openalex.org/W7161568262","doi":"https://doi.org/10.48550/arxiv.2605.15383","title":"MorphoHELM: A Comprehensive Benchmark for Evaluating Representations for Microscopy-Based Morphology Assays","display_name":"MorphoHELM: A Comprehensive Benchmark for Evaluating Representations for Microscopy-Based Morphology Assays","publication_year":2026,"publication_date":"2026-05-14","ids":{"openalex":"https://openalex.org/W7161568262","doi":"https://doi.org/10.48550/arxiv.2605.15383"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.15383","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15383","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.15383","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136378234","display_name":"Emre Hayir","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hayir, Emre","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123097120","display_name":"Lorin Crawford","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Crawford, Lorin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134023223","display_name":"Alex X. Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Alex X.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12874","display_name":"Digital Imaging for Blood Diseases","score":0.002199999988079071,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.000699999975040555,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7753999829292297},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5304999947547913},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.46480000019073486},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.42329999804496765},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4138000011444092},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4117000102996826},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39419999718666077},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3917999863624573}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7753999829292297},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7739999890327454},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6373999714851379},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5640000104904175},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5304999947547913},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.46480000019073486},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4575999975204468},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.42329999804496765},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4138000011444092},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4117000102996826},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39419999718666077},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3917999863624573},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.366100013256073},{"id":"https://openalex.org/C116409475","wikidata":"https://www.wikidata.org/wiki/Q1385056","display_name":"External Data Representation","level":2,"score":0.33730000257492065},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.25540000200271606}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.15383","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15383","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.15383","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15383","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Microscopy":[0],"images":[1],"contain":[2],"rich":[3],"information":[4],"about":[5],"how":[6,143],"cells":[7],"respond":[8],"to":[9,14,69,106,118,148,161],"perturbations,":[10],"making":[11,66],"them":[12,105],"essential":[13],"applications":[15],"like":[16],"drug":[17],"screening.":[18],"To":[19],"quantify":[20],"images,":[21],"researchers":[22],"often":[23],"use":[24],"representation":[25],"extraction":[26,84],"methods,":[27,165],"and":[28,59,64,103,110,166,208],"recent":[29],"years":[30],"have":[31],"seen":[32],"a":[33,77],"proliferation":[34],"of":[35,43,116,123,135,146,176],"deep":[36],"learning":[37],"methods.":[38],"While":[39],"measuring":[40],"the":[41,89,100,113,124,144,200],"quality":[42],"these":[44,157],"representations":[45],"is":[46,126,130],"essential,":[47],"evaluation":[48,97,209],"remains":[49],"fragmented,":[50],"with":[51],"each":[52,128],"proposed":[53],"model":[54,188],"evaluated":[55,131],"on":[56,112],"different":[57,133],"tasks":[58],"datasets,":[60,206],"using":[61],"custom":[62],"pipelines":[63],"metrics,":[65],"it":[67],"difficult":[68],"fairly":[70],"compare":[71],"models.":[72],"Here,":[73],"we":[74,167],"introduce":[75],"MorphoHELM,":[76],"comprehensive":[78],"open":[79],"benchmark":[80,125],"for":[81,86],"evaluating":[82],"feature":[83,122],"methods":[85,117,147],"Cell":[87],"Painting,":[88],"most":[90],"widely-used":[91],"morphological":[92],"profiling":[93],"assay.":[94],"MorphoHELM":[95,160],"consolidates":[96],"standards":[98],"in":[99],"field,":[101],"extends":[102],"corrects":[104],"be":[107],"more":[108],"robust,":[109],"evaluates":[111],"widest":[114],"range":[115],"date.":[119],"A":[120],"defining":[121],"that":[127,169,171,185],"task":[129],"at":[132,173,181,214],"degrees":[134],"batch":[136],"effects":[137],"(or":[138],"technical":[139],"noise),":[140],"directly":[141],"quantifying":[142],"ability":[145],"detect":[149,162],"biological":[150,177],"signal":[151,178],"degrades":[152],"as":[153],"noise":[154],"increases.":[155],"Together,":[156],"properties":[158],"enable":[159],"trade-offs":[163],"between":[164],"demonstrate":[168],"models":[170],"excel":[172],"certain":[174],"kinds":[175],"are":[179,211],"weaker":[180],"others.":[182],"We":[183],"show":[184],"no":[186],"existing":[187],"outperforms":[189],"classic":[190],"computer":[191],"vision":[192],"analytic":[193],"strategies":[194],"across":[195],"all":[196],"settings,":[197],"which":[198],"remain":[199],"strongest":[201],"general":[202],"use-case":[203],"representations.":[204],"All":[205],"code,":[207],"tools":[210],"publicly":[212],"available":[213],"https://github.com/microsoft/MorphoHELM.":[215]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-05-19T00:00:00"}
