{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2014:IOITODY3FCCELK7G3RWYIHZZJK","short_pith_number":"pith:IOITODY3","canonical_record":{"source":{"id":"1403.3414","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.GN","submitted_at":"2014-03-13T20:05:45Z","cross_cats_sorted":["math.ST","q-bio.PE","stat.TH"],"title_canon_sha256":"01a1e5a3517bbcd42922e1a5dd6c911d5433c165e077e6426b8aef777e76dccd","abstract_canon_sha256":"68fa5184defc6b39e7cbc662875b5bd68ee336890a300eb670b4eca7d465a989"},"schema_version":"1.0"},"canonical_sha256":"4391370f1b288445abe6dc6d841f394a89929ed83fef4fd4bf18ffe965e3759d","source":{"kind":"arxiv","id":"1403.3414","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1403.3414","created_at":"2026-05-18T02:56:20Z"},{"alias_kind":"arxiv_version","alias_value":"1403.3414v1","created_at":"2026-05-18T02:56:20Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1403.3414","created_at":"2026-05-18T02:56:20Z"},{"alias_kind":"pith_short_12","alias_value":"IOITODY3FCCE","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_16","alias_value":"IOITODY3FCCELK7G","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_8","alias_value":"IOITODY3","created_at":"2026-05-18T12:28:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2014:IOITODY3FCCELK7G3RWYIHZZJK","target":"record","payload":{"canonical_record":{"source":{"id":"1403.3414","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.GN","submitted_at":"2014-03-13T20:05:45Z","cross_cats_sorted":["math.ST","q-bio.PE","stat.TH"],"title_canon_sha256":"01a1e5a3517bbcd42922e1a5dd6c911d5433c165e077e6426b8aef777e76dccd","abstract_canon_sha256":"68fa5184defc6b39e7cbc662875b5bd68ee336890a300eb670b4eca7d465a989"},"schema_version":"1.0"},"canonical_sha256":"4391370f1b288445abe6dc6d841f394a89929ed83fef4fd4bf18ffe965e3759d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:56:20.523498Z","signature_b64":"plv3wMBIAXugxf/PpUGI1uuDyMyeErzMikgQErcbvarkQ6103x8/6+kUBjidI2rp2kIXq/8Tc0c9izeP63AuBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4391370f1b288445abe6dc6d841f394a89929ed83fef4fd4bf18ffe965e3759d","last_reissued_at":"2026-05-18T02:56:20.522819Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:56:20.522819Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1403.3414","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:56:20Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/orqRbLVjqBDQPPR2WQyBAHiZkkVTaptMK1dCk99GZeM3j5s6QBcjImGUYsO2Im++5mO+im1/fd9vVYpdZ4mAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T22:19:51.939626Z"},"content_sha256":"fb6f0bc3619f2f0deb8328c599fb346bad2d0532d1769c3013868d2cba923844","schema_version":"1.0","event_id":"sha256:fb6f0bc3619f2f0deb8328c599fb346bad2d0532d1769c3013868d2cba923844"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2014:IOITODY3FCCELK7G3RWYIHZZJK","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Predicting discovery rates of genomic features","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["math.ST","q-bio.PE","stat.TH"],"primary_cat":"q-bio.GN","authors_text":"NHLBI GO Exome Sequencing Project, Simon Gravel","submitted_at":"2014-03-13T20:05:45Z","abstract_excerpt":"Successful sequencing experiments require judicious sample selection. However, this selection must often be performed on the basis of limited preliminary data. Predicting the statistical properties of the final sample based on preliminary data can be challenging, because numerous uncertain model assumptions may be involved. Here, we ask whether we can predict ``omics\" variation across many samples by sequencing only a fraction of them. In the infinite-genome limit, we find that a pilot study sequencing $5\\%$ of a population is sufficient to predict the number of genetic variants in the entire "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1403.3414","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:56:20Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"dirC1R9RiwGndrnEFqKGDdZEPP/T9n438oDmiD0lA6ZLtXcXLLROvAyLtSswUDru196snaplOkiKLJaNpTmJBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T22:19:51.940203Z"},"content_sha256":"80e117e93dea60205051c0605a487098b16d8af073ca2267cec9be9990ab08be","schema_version":"1.0","event_id":"sha256:80e117e93dea60205051c0605a487098b16d8af073ca2267cec9be9990ab08be"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/IOITODY3FCCELK7G3RWYIHZZJK/bundle.json","state_url":"https://pith.science/pith/IOITODY3FCCELK7G3RWYIHZZJK/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/IOITODY3FCCELK7G3RWYIHZZJK/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T22:19:51Z","links":{"resolver":"https://pith.science/pith/IOITODY3FCCELK7G3RWYIHZZJK","bundle":"https://pith.science/pith/IOITODY3FCCELK7G3RWYIHZZJK/bundle.json","state":"https://pith.science/pith/IOITODY3FCCELK7G3RWYIHZZJK/state.json","well_known_bundle":"https://pith.science/.well-known/pith/IOITODY3FCCELK7G3RWYIHZZJK/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:IOITODY3FCCELK7G3RWYIHZZJK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"68fa5184defc6b39e7cbc662875b5bd68ee336890a300eb670b4eca7d465a989","cross_cats_sorted":["math.ST","q-bio.PE","stat.TH"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.GN","submitted_at":"2014-03-13T20:05:45Z","title_canon_sha256":"01a1e5a3517bbcd42922e1a5dd6c911d5433c165e077e6426b8aef777e76dccd"},"schema_version":"1.0","source":{"id":"1403.3414","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1403.3414","created_at":"2026-05-18T02:56:20Z"},{"alias_kind":"arxiv_version","alias_value":"1403.3414v1","created_at":"2026-05-18T02:56:20Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1403.3414","created_at":"2026-05-18T02:56:20Z"},{"alias_kind":"pith_short_12","alias_value":"IOITODY3FCCE","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_16","alias_value":"IOITODY3FCCELK7G","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_8","alias_value":"IOITODY3","created_at":"2026-05-18T12:28:33Z"}],"graph_snapshots":[{"event_id":"sha256:80e117e93dea60205051c0605a487098b16d8af073ca2267cec9be9990ab08be","target":"graph","created_at":"2026-05-18T02:56:20Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Successful sequencing experiments require judicious sample selection. However, this selection must often be performed on the basis of limited preliminary data. Predicting the statistical properties of the final sample based on preliminary data can be challenging, because numerous uncertain model assumptions may be involved. Here, we ask whether we can predict ``omics\" variation across many samples by sequencing only a fraction of them. In the infinite-genome limit, we find that a pilot study sequencing $5\\%$ of a population is sufficient to predict the number of genetic variants in the entire ","authors_text":"NHLBI GO Exome Sequencing Project, Simon Gravel","cross_cats":["math.ST","q-bio.PE","stat.TH"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.GN","submitted_at":"2014-03-13T20:05:45Z","title":"Predicting discovery rates of genomic features"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1403.3414","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fb6f0bc3619f2f0deb8328c599fb346bad2d0532d1769c3013868d2cba923844","target":"record","created_at":"2026-05-18T02:56:20Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"68fa5184defc6b39e7cbc662875b5bd68ee336890a300eb670b4eca7d465a989","cross_cats_sorted":["math.ST","q-bio.PE","stat.TH"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.GN","submitted_at":"2014-03-13T20:05:45Z","title_canon_sha256":"01a1e5a3517bbcd42922e1a5dd6c911d5433c165e077e6426b8aef777e76dccd"},"schema_version":"1.0","source":{"id":"1403.3414","kind":"arxiv","version":1}},"canonical_sha256":"4391370f1b288445abe6dc6d841f394a89929ed83fef4fd4bf18ffe965e3759d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4391370f1b288445abe6dc6d841f394a89929ed83fef4fd4bf18ffe965e3759d","first_computed_at":"2026-05-18T02:56:20.522819Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:56:20.522819Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"plv3wMBIAXugxf/PpUGI1uuDyMyeErzMikgQErcbvarkQ6103x8/6+kUBjidI2rp2kIXq/8Tc0c9izeP63AuBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T02:56:20.523498Z","signed_message":"canonical_sha256_bytes"},"source_id":"1403.3414","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fb6f0bc3619f2f0deb8328c599fb346bad2d0532d1769c3013868d2cba923844","sha256:80e117e93dea60205051c0605a487098b16d8af073ca2267cec9be9990ab08be"],"state_sha256":"5f23078443382800ea55bb0b188e24c6a58968ca9c77f68668726bd3bdb6be2e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"xiNzmkbTbdFOjt45JYV9LI/gZ4ZhwDeVyC6OtUv9J5lx5nBaNzWhTeiBvcpvlSS63maHc/fRUg5n7aMqB+vCBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T22:19:51.943193Z","bundle_sha256":"ced7de45f76d4b5e03e575b80db65b2014ab0a7ff88520016866897e40c0e79a"}}