{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:WDFD5QSBM36SI7CNNSJBQSLI5R","short_pith_number":"pith:WDFD5QSB","schema_version":"1.0","canonical_sha256":"b0ca3ec24166fd247c4d6c92184968ec7ef35b6206372d91ddaeafde08bd3ca3","source":{"kind":"arxiv","id":"2605.15383","version":1},"attestation_state":"computed","paper":{"title":"MorphoHELM: A Comprehensive Benchmark for Evaluating Representations for Microscopy-Based Morphology Assays","license":"http://creativecommons.org/licenses/by/4.0/","headline":"No existing model outperforms classic computer vision analytic strategies across all settings for microscopy morphology representations.","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Alex X. Lu, Emre Hayir, Lorin Crawford","submitted_at":"2026-05-14T20:13:36Z","abstract_excerpt":"Microscopy images contain rich information about how cells respond to perturbations, making them essential to applications like drug screening. To quantify images, researchers often use representation extraction methods, and recent years have seen a proliferation of deep learning methods. While measuring the quality of these representations is essential, evaluation remains fragmented, with each proposed model evaluated on different tasks and datasets, using custom pipelines and metrics, making it difficult to fairly compare models. Here, we introduce MorphoHELM, a comprehensive open benchmark "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":true,"formal_links_present":true},"canonical_record":{"source":{"id":"2605.15383","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T20:13:36Z","cross_cats_sorted":[],"title_canon_sha256":"e4aa93a82aacc71599ddae0072df1de920077f157588ac4f67b6f537e05d4de3","abstract_canon_sha256":"0fcb6a5de94a2c7a969f7fb2da14f1c8621c00a8c84fdefb5fdbb9ebc694500c"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:00:55.624794Z","signature_b64":"goz6LQ8lMRwNNzm6Fvwpb3dAxldmMfLgVjqrN3U4o1tadJfEjfnPpf6m6+JNqtVyejPNHxmlEKu92ichK+QtCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b0ca3ec24166fd247c4d6c92184968ec7ef35b6206372d91ddaeafde08bd3ca3","last_reissued_at":"2026-05-20T00:00:55.623900Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:00:55.623900Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"MorphoHELM: A Comprehensive Benchmark for Evaluating Representations for Microscopy-Based Morphology Assays","license":"http://creativecommons.org/licenses/by/4.0/","headline":"No existing model outperforms classic computer vision analytic strategies across all settings for microscopy morphology representations.","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Alex X. Lu, Emre Hayir, Lorin Crawford","submitted_at":"2026-05-14T20:13:36Z","abstract_excerpt":"Microscopy images contain rich information about how cells respond to perturbations, making them essential to applications like drug screening. To quantify images, researchers often use representation extraction methods, and recent years have seen a proliferation of deep learning methods. While measuring the quality of these representations is essential, evaluation remains fragmented, with each proposed model evaluated on different tasks and datasets, using custom pipelines and metrics, making it difficult to fairly compare models. Here, we introduce MorphoHELM, a comprehensive open benchmark "},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"No existing model outperforms classic computer vision analytic strategies across all settings, which remain the strongest general use-case representations.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"The selected tasks, metrics, and simulated batch effect levels accurately and comprehensively capture the ability of representations to detect true biological signals without introducing bias from the choice of evaluation standards or noise models.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"MorphoHELM is a new benchmark for Cell Painting morphology representations that tests methods across increasing batch effect levels and finds classic computer vision strategies remain the strongest general-purpose performers.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"No existing model outperforms classic computer vision analytic strategies across all settings for microscopy morphology representations.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"e0e1b88b0d6ceca1ff62e3d5e731210a0f6d2c143f85e3a1fa1410230d3dbad4"},"source":{"id":"2605.15383","kind":"arxiv","version":1},"verdict":{"id":"a4d45c3d-7fd0-4bf2-af3a-3fc34b594204","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-19T15:42:44.492555Z","strongest_claim":"No existing model outperforms classic computer vision analytic strategies across all settings, which remain the strongest general use-case representations.","one_line_summary":"MorphoHELM is a new benchmark for Cell Painting morphology representations that tests methods across increasing batch effect levels and finds classic computer vision strategies remain the strongest general-purpose performers.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"The selected tasks, metrics, and simulated batch effect levels accurately and comprehensively capture the ability of representations to detect true biological signals without introducing bias from the choice of evaluation standards or noise models.","pith_extraction_headline":"No existing model outperforms classic computer vision analytic strategies across all settings for microscopy morphology representations."},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.15383/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"doi_title_agreement","ran_at":"2026-05-19T16:01:18.046510Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"doi_compliance","ran_at":"2026-05-19T15:53:41.636383Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"citation_quote_validity","ran_at":"2026-05-19T15:51:01.363590Z","status":"completed","version":"0.1.0","findings_count":0},{"name":"claim_evidence","ran_at":"2026-05-19T14:21:54.176534Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"ai_meta_artifact","ran_at":"2026-05-19T13:33:22.728369Z","status":"skipped","version":"1.0.0","findings_count":0}],"snapshot_sha256":"f54117e870fbfd27dcc8aac821f61ffe3578fe76286cb62a613ae03502e8efeb"},"references":{"count":40,"sample":[{"doi":"10.1038/nprot.2016.105","year":2016,"title":"Cell Painting, a high-content image-based assay for morphological pro ﬁling using multiplexed ﬂuorescent dyes","work_id":"218e96e0-ddd8-4d2a-9fe7-b274d96e4355","ref_index":1,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"10.1038/s41592-024-02528-8","year":2024,"title":"Srijit Seal, Maria-Anna Trapotsi, Ola Spjuth, Shantanu Singh, Jordi Carreras-Puigvert, Nigel Greene, Andreas Bender, and Anne E. Carpenter. Cell painting: a decade of discovery and innovation in cellu","work_id":"19943a5c-9580-444e-8db0-8304bfcbc0d5","ref_index":2,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"10.1038/nmeth.4397","year":2017,"title":"Data-analysis strategies for image-based cell profiling","work_id":"c89a8677-2f80-4575-a900-d60aa9c019ae","ref_index":3,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"10.1016/j.coisb.2018.05.004","year":2018,"title":"Machine learning and image-ba sed proﬁl- ing in drug discovery","work_id":"10ab9388-e730-4898-b2fe-51cf4ad9dab3","ref_index":4,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":2021,"title":"Image-based profiling for drug discovery: due for a machine-learning upgrade?Nat","work_id":"f22a9b8a-d0f4-4862-bd07-13cf04bb191a","ref_index":5,"cited_arxiv_id":"","is_internal_anchor":false}],"resolved_work":40,"snapshot_sha256":"f7723dca14c293b483bd2b4f17747a5e19f569b914c204fabd13774c0727356a","internal_anchors":1},"formal_canon":{"evidence_count":2,"snapshot_sha256":"9ec3fdb05715f501a84ad8b30173eba8ef2194d132709049b620027ec664ff32"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.15383","created_at":"2026-05-20T00:00:55.624022+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.15383v1","created_at":"2026-05-20T00:00:55.624022+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.15383","created_at":"2026-05-20T00:00:55.624022+00:00"},{"alias_kind":"pith_short_12","alias_value":"WDFD5QSBM36S","created_at":"2026-05-20T00:00:55.624022+00:00"},{"alias_kind":"pith_short_16","alias_value":"WDFD5QSBM36SI7CN","created_at":"2026-05-20T00:00:55.624022+00:00"},{"alias_kind":"pith_short_8","alias_value":"WDFD5QSB","created_at":"2026-05-20T00:00:55.624022+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":2,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R","json":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R.json","graph_json":"https://pith.science/api/pith-number/WDFD5QSBM36SI7CNNSJBQSLI5R/graph.json","events_json":"https://pith.science/api/pith-number/WDFD5QSBM36SI7CNNSJBQSLI5R/events.json","paper":"https://pith.science/paper/WDFD5QSB"},"agent_actions":{"view_html":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R","download_json":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R.json","view_paper":"https://pith.science/paper/WDFD5QSB","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.15383&json=true","fetch_graph":"https://pith.science/api/pith-number/WDFD5QSBM36SI7CNNSJBQSLI5R/graph.json","fetch_events":"https://pith.science/api/pith-number/WDFD5QSBM36SI7CNNSJBQSLI5R/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R/action/timestamp_anchor","attest_storage":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R/action/storage_attestation","attest_author":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R/action/author_attestation","sign_citation":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R/action/citation_signature","submit_replication":"https://pith.science/pith/WDFD5QSBM36SI7CNNSJBQSLI5R/action/replication_record"}},"created_at":"2026-05-20T00:00:55.624022+00:00","updated_at":"2026-05-20T00:00:55.624022+00:00"}