{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:5KNBKHIA77J3IB5QJRABDY5PH7","short_pith_number":"pith:5KNBKHIA","canonical_record":{"source":{"id":"2512.02182","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ME","submitted_at":"2025-12-01T20:22:34Z","cross_cats_sorted":["stat.AP"],"title_canon_sha256":"b4ba8c88016f430fc9cfe8ee7b8329d79d9569edaef379a37a8f5cdbab12db5d","abstract_canon_sha256":"c0025addf96c3d21f44ac82ce3b275bd4b878dfaa1d93e07cdea7a7c37db6c14"},"schema_version":"1.0"},"canonical_sha256":"ea9a151d00ffd3b407b04c4011e3af3fd3d3df770cadff67f6fe3450c8ea3541","source":{"kind":"arxiv","id":"2512.02182","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2512.02182","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"arxiv_version","alias_value":"2512.02182v3","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2512.02182","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"pith_short_12","alias_value":"5KNBKHIA77J3","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"pith_short_16","alias_value":"5KNBKHIA77J3IB5Q","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"pith_short_8","alias_value":"5KNBKHIA","created_at":"2026-05-21T01:04:19Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:5KNBKHIA77J3IB5QJRABDY5PH7","target":"record","payload":{"canonical_record":{"source":{"id":"2512.02182","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ME","submitted_at":"2025-12-01T20:22:34Z","cross_cats_sorted":["stat.AP"],"title_canon_sha256":"b4ba8c88016f430fc9cfe8ee7b8329d79d9569edaef379a37a8f5cdbab12db5d","abstract_canon_sha256":"c0025addf96c3d21f44ac82ce3b275bd4b878dfaa1d93e07cdea7a7c37db6c14"},"schema_version":"1.0"},"canonical_sha256":"ea9a151d00ffd3b407b04c4011e3af3fd3d3df770cadff67f6fe3450c8ea3541","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-21T01:04:19.378451Z","signature_b64":"aBOLF2L9ncUBz1aFiBQrFmi5aD/vayzIyGaikC5Vz/LZXSAp2tBf+l4JKFqzankgvk/XTyIzU+jkCGNCJBjIAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"ea9a151d00ffd3b407b04c4011e3af3fd3d3df770cadff67f6fe3450c8ea3541","last_reissued_at":"2026-05-21T01:04:19.377104Z","signature_status":"signed_v1","first_computed_at":"2026-05-21T01:04:19.377104Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2512.02182","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T01:04:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Yoc031EVwBHRpIrvurHMq8xnbhy3PcjDSsgwJGRuAlqiVVdhN6UkexxiXdRPeY6F+jdyvLCXITd02oqDqXTWBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T05:23:21.147714Z"},"content_sha256":"583fcebcb8528f90c1f8ab16bfa95d9303869b8573a2dbbd21ee2c766d428cf1","schema_version":"1.0","event_id":"sha256:583fcebcb8528f90c1f8ab16bfa95d9303869b8573a2dbbd21ee2c766d428cf1"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:5KNBKHIA77J3IB5QJRABDY5PH7","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Two-phase validation sampling via principal components to improve efficiency in multi-model estimation from error-prone biomedical databases","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["stat.AP"],"primary_cat":"stat.ME","authors_text":"Cole Manschot, Sarah C. Lotspeich","submitted_at":"2025-12-01T20:22:34Z","abstract_excerpt":"Two-phase sampling offers a cost-effective way to validate error-prone covariate measurements in biomedical databases. Inexpensive or easy-to-obtain information is collected for the entire study in Phase I. Then, a subset of patients undergoes cost-intensive validation (e.g., expert chart review) to collect more accurate data in Phase II. When balancing primary and secondary analyses, competing models and priorities can result in poorly defined objectives for the most informative Phase II sampling criterion. Extreme tail sampling (ETS), wherein patients with the smallest and largest values of "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2512.02182","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2512.02182/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T01:04:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QASasU51wu24V3jn1o5i7uhVip0lnzGDV/QWEUZ93Tc82RZMuh5GcU+zevhJ4ZjMeQ8C76+HUwMJKpERIv88AA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T05:23:21.148092Z"},"content_sha256":"bbd32aed443ddc1d23f44964215ba434c6d80da1625b530dfbe63f32a33b05fb","schema_version":"1.0","event_id":"sha256:bbd32aed443ddc1d23f44964215ba434c6d80da1625b530dfbe63f32a33b05fb"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5KNBKHIA77J3IB5QJRABDY5PH7/bundle.json","state_url":"https://pith.science/pith/5KNBKHIA77J3IB5QJRABDY5PH7/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5KNBKHIA77J3IB5QJRABDY5PH7/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-12T05:23:21Z","links":{"resolver":"https://pith.science/pith/5KNBKHIA77J3IB5QJRABDY5PH7","bundle":"https://pith.science/pith/5KNBKHIA77J3IB5QJRABDY5PH7/bundle.json","state":"https://pith.science/pith/5KNBKHIA77J3IB5QJRABDY5PH7/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5KNBKHIA77J3IB5QJRABDY5PH7/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:5KNBKHIA77J3IB5QJRABDY5PH7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c0025addf96c3d21f44ac82ce3b275bd4b878dfaa1d93e07cdea7a7c37db6c14","cross_cats_sorted":["stat.AP"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ME","submitted_at":"2025-12-01T20:22:34Z","title_canon_sha256":"b4ba8c88016f430fc9cfe8ee7b8329d79d9569edaef379a37a8f5cdbab12db5d"},"schema_version":"1.0","source":{"id":"2512.02182","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2512.02182","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"arxiv_version","alias_value":"2512.02182v3","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2512.02182","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"pith_short_12","alias_value":"5KNBKHIA77J3","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"pith_short_16","alias_value":"5KNBKHIA77J3IB5Q","created_at":"2026-05-21T01:04:19Z"},{"alias_kind":"pith_short_8","alias_value":"5KNBKHIA","created_at":"2026-05-21T01:04:19Z"}],"graph_snapshots":[{"event_id":"sha256:bbd32aed443ddc1d23f44964215ba434c6d80da1625b530dfbe63f32a33b05fb","target":"graph","created_at":"2026-05-21T01:04:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2512.02182/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Two-phase sampling offers a cost-effective way to validate error-prone covariate measurements in biomedical databases. Inexpensive or easy-to-obtain information is collected for the entire study in Phase I. Then, a subset of patients undergoes cost-intensive validation (e.g., expert chart review) to collect more accurate data in Phase II. When balancing primary and secondary analyses, competing models and priorities can result in poorly defined objectives for the most informative Phase II sampling criterion. Extreme tail sampling (ETS), wherein patients with the smallest and largest values of ","authors_text":"Cole Manschot, Sarah C. Lotspeich","cross_cats":["stat.AP"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ME","submitted_at":"2025-12-01T20:22:34Z","title":"Two-phase validation sampling via principal components to improve efficiency in multi-model estimation from error-prone biomedical databases"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2512.02182","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:583fcebcb8528f90c1f8ab16bfa95d9303869b8573a2dbbd21ee2c766d428cf1","target":"record","created_at":"2026-05-21T01:04:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c0025addf96c3d21f44ac82ce3b275bd4b878dfaa1d93e07cdea7a7c37db6c14","cross_cats_sorted":["stat.AP"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ME","submitted_at":"2025-12-01T20:22:34Z","title_canon_sha256":"b4ba8c88016f430fc9cfe8ee7b8329d79d9569edaef379a37a8f5cdbab12db5d"},"schema_version":"1.0","source":{"id":"2512.02182","kind":"arxiv","version":3}},"canonical_sha256":"ea9a151d00ffd3b407b04c4011e3af3fd3d3df770cadff67f6fe3450c8ea3541","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ea9a151d00ffd3b407b04c4011e3af3fd3d3df770cadff67f6fe3450c8ea3541","first_computed_at":"2026-05-21T01:04:19.377104Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-21T01:04:19.377104Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"aBOLF2L9ncUBz1aFiBQrFmi5aD/vayzIyGaikC5Vz/LZXSAp2tBf+l4JKFqzankgvk/XTyIzU+jkCGNCJBjIAw==","signature_status":"signed_v1","signed_at":"2026-05-21T01:04:19.378451Z","signed_message":"canonical_sha256_bytes"},"source_id":"2512.02182","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:583fcebcb8528f90c1f8ab16bfa95d9303869b8573a2dbbd21ee2c766d428cf1","sha256:bbd32aed443ddc1d23f44964215ba434c6d80da1625b530dfbe63f32a33b05fb"],"state_sha256":"a6029ef92f7890da3bad20a685970754c7d61c5d843d90242c734e0eb47e95c4"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"4CSPC1PZu6Nw74FeKKFql7SA+QlDLkQvXGXUurZ6nClo+rcmbvcPT6ww0WUsUTGYAXeoKBJLlPKJMPGy/G+GBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-12T05:23:21.150321Z","bundle_sha256":"11289065f9b26e0fd5f0d1730372d0b3b82208add902ff6142be4f2a9bdea970"}}