{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:7BUIC52KGTKDU6CRW4ETTAN3ZD","short_pith_number":"pith:7BUIC52K","canonical_record":{"source":{"id":"1502.02312","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2015-02-08T22:42:42Z","cross_cats_sorted":[],"title_canon_sha256":"b08b9cc5cdffa44a51cfd495b73600eae10dd1b216a1b40449cbdba760e6d441","abstract_canon_sha256":"744ddd9ea91e9dd338847cf5f5e686582e401df56d18b533dcf2eb668e6a8a5a"},"schema_version":"1.0"},"canonical_sha256":"f86881774a34d43a7851b7093981bbc8c9cc145cec66d3d198f93e8392044a33","source":{"kind":"arxiv","id":"1502.02312","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1502.02312","created_at":"2026-05-18T02:07:26Z"},{"alias_kind":"arxiv_version","alias_value":"1502.02312v2","created_at":"2026-05-18T02:07:26Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1502.02312","created_at":"2026-05-18T02:07:26Z"},{"alias_kind":"pith_short_12","alias_value":"7BUIC52KGTKD","created_at":"2026-05-18T12:29:07Z"},{"alias_kind":"pith_short_16","alias_value":"7BUIC52KGTKDU6CR","created_at":"2026-05-18T12:29:07Z"},{"alias_kind":"pith_short_8","alias_value":"7BUIC52K","created_at":"2026-05-18T12:29:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:7BUIC52KGTKDU6CRW4ETTAN3ZD","target":"record","payload":{"canonical_record":{"source":{"id":"1502.02312","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2015-02-08T22:42:42Z","cross_cats_sorted":[],"title_canon_sha256":"b08b9cc5cdffa44a51cfd495b73600eae10dd1b216a1b40449cbdba760e6d441","abstract_canon_sha256":"744ddd9ea91e9dd338847cf5f5e686582e401df56d18b533dcf2eb668e6a8a5a"},"schema_version":"1.0"},"canonical_sha256":"f86881774a34d43a7851b7093981bbc8c9cc145cec66d3d198f93e8392044a33","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:07:26.487285Z","signature_b64":"6pBSTPkkycPArJUH0GlOOGolB0bsCPWF+KSOFa8RW2B6SH/VxetTqVcR5a8sTuOBV4KlCkC3qfVxJIKI3EFZAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f86881774a34d43a7851b7093981bbc8c9cc145cec66d3d198f93e8392044a33","last_reissued_at":"2026-05-18T02:07:26.486886Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:07:26.486886Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1502.02312","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:07:26Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"H0kRmHbfgtBeZKhspFya9KL6N3gsQ2NLbGrhjGgTdq8aBYNVz+9AVWSD6VdfDK2/733hu5dBBStrtaEIe1NHAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T10:35:22.245590Z"},"content_sha256":"b396221f11e690960f8c5eccfe6a8c4d87fd7e6daa9799312d69eaa0dbbab208","schema_version":"1.0","event_id":"sha256:b396221f11e690960f8c5eccfe6a8c4d87fd7e6daa9799312d69eaa0dbbab208"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:7BUIC52KGTKDU6CRW4ETTAN3ZD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Bayesian and empirical Bayesian forests","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"stat.AP","authors_text":"Chun-Sheng Chen, Jun Yu, Matt Taddy, Mitch Wyle","submitted_at":"2015-02-08T22:42:42Z","abstract_excerpt":"We derive ensembles of decision trees through a nonparametric Bayesian model, allowing us to view random forests as samples from a posterior distribution. This insight provides large gains in interpretability, and motivates a class of Bayesian forest (BF) algorithms that yield small but reliable performance gains. Based on the BF framework, we are able to show that high-level tree hierarchy is stable in large samples. This leads to an empirical Bayesian forest (EBF) algorithm for building approximate BFs on massive distributed datasets and we show that EBFs outperform sub-sampling based altern"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1502.02312","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:07:26Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IDS3jlm5+RO+KOtboaaZFqfzDpy45J5hu+V3W87HXG4GA6TCQDoxewjm/v1ua/e/Uw9lA2zHbnlOBgxiRBcVAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T10:35:22.245929Z"},"content_sha256":"74ea13d52733ab55ffbd6aebb3e4679b7beac4adb2f98dd2b13b351aa71877ce","schema_version":"1.0","event_id":"sha256:74ea13d52733ab55ffbd6aebb3e4679b7beac4adb2f98dd2b13b351aa71877ce"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/7BUIC52KGTKDU6CRW4ETTAN3ZD/bundle.json","state_url":"https://pith.science/pith/7BUIC52KGTKDU6CRW4ETTAN3ZD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/7BUIC52KGTKDU6CRW4ETTAN3ZD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T10:35:22Z","links":{"resolver":"https://pith.science/pith/7BUIC52KGTKDU6CRW4ETTAN3ZD","bundle":"https://pith.science/pith/7BUIC52KGTKDU6CRW4ETTAN3ZD/bundle.json","state":"https://pith.science/pith/7BUIC52KGTKDU6CRW4ETTAN3ZD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/7BUIC52KGTKDU6CRW4ETTAN3ZD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:7BUIC52KGTKDU6CRW4ETTAN3ZD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"744ddd9ea91e9dd338847cf5f5e686582e401df56d18b533dcf2eb668e6a8a5a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2015-02-08T22:42:42Z","title_canon_sha256":"b08b9cc5cdffa44a51cfd495b73600eae10dd1b216a1b40449cbdba760e6d441"},"schema_version":"1.0","source":{"id":"1502.02312","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1502.02312","created_at":"2026-05-18T02:07:26Z"},{"alias_kind":"arxiv_version","alias_value":"1502.02312v2","created_at":"2026-05-18T02:07:26Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1502.02312","created_at":"2026-05-18T02:07:26Z"},{"alias_kind":"pith_short_12","alias_value":"7BUIC52KGTKD","created_at":"2026-05-18T12:29:07Z"},{"alias_kind":"pith_short_16","alias_value":"7BUIC52KGTKDU6CR","created_at":"2026-05-18T12:29:07Z"},{"alias_kind":"pith_short_8","alias_value":"7BUIC52K","created_at":"2026-05-18T12:29:07Z"}],"graph_snapshots":[{"event_id":"sha256:74ea13d52733ab55ffbd6aebb3e4679b7beac4adb2f98dd2b13b351aa71877ce","target":"graph","created_at":"2026-05-18T02:07:26Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We derive ensembles of decision trees through a nonparametric Bayesian model, allowing us to view random forests as samples from a posterior distribution. This insight provides large gains in interpretability, and motivates a class of Bayesian forest (BF) algorithms that yield small but reliable performance gains. Based on the BF framework, we are able to show that high-level tree hierarchy is stable in large samples. This leads to an empirical Bayesian forest (EBF) algorithm for building approximate BFs on massive distributed datasets and we show that EBFs outperform sub-sampling based altern","authors_text":"Chun-Sheng Chen, Jun Yu, Matt Taddy, Mitch Wyle","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2015-02-08T22:42:42Z","title":"Bayesian and empirical Bayesian forests"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1502.02312","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b396221f11e690960f8c5eccfe6a8c4d87fd7e6daa9799312d69eaa0dbbab208","target":"record","created_at":"2026-05-18T02:07:26Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"744ddd9ea91e9dd338847cf5f5e686582e401df56d18b533dcf2eb668e6a8a5a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2015-02-08T22:42:42Z","title_canon_sha256":"b08b9cc5cdffa44a51cfd495b73600eae10dd1b216a1b40449cbdba760e6d441"},"schema_version":"1.0","source":{"id":"1502.02312","kind":"arxiv","version":2}},"canonical_sha256":"f86881774a34d43a7851b7093981bbc8c9cc145cec66d3d198f93e8392044a33","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f86881774a34d43a7851b7093981bbc8c9cc145cec66d3d198f93e8392044a33","first_computed_at":"2026-05-18T02:07:26.486886Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:07:26.486886Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"6pBSTPkkycPArJUH0GlOOGolB0bsCPWF+KSOFa8RW2B6SH/VxetTqVcR5a8sTuOBV4KlCkC3qfVxJIKI3EFZAg==","signature_status":"signed_v1","signed_at":"2026-05-18T02:07:26.487285Z","signed_message":"canonical_sha256_bytes"},"source_id":"1502.02312","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b396221f11e690960f8c5eccfe6a8c4d87fd7e6daa9799312d69eaa0dbbab208","sha256:74ea13d52733ab55ffbd6aebb3e4679b7beac4adb2f98dd2b13b351aa71877ce"],"state_sha256":"3b8c30d7289de07e9a9ebcb837a879f3d9cadc1053d4a9653318a916c34eff84"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ABh/wpD+HhaqRtPgnakZ8dlSB1AM3uM6FfKjYM350n5uUy9Oip1YDXYKw7jJ9alLAJxLSMMmkXOGE5RRHk9nBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T10:35:22.247837Z","bundle_sha256":"f747e71728fa01d7b77a4afd40419245289c163b1b661eeba2ea5a70c89fadb8"}}