{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:QBPHCYCZDIYFY5DATSSDJ5OBV5","short_pith_number":"pith:QBPHCYCZ","canonical_record":{"source":{"id":"1609.06783","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-09-22T00:10:16Z","cross_cats_sorted":["cs.CL","cs.LG"],"title_canon_sha256":"a7e84d4cd485b3c782a361288ff61b097bacfe44bc3f0cacceeb1fba61a0bb5d","abstract_canon_sha256":"7258b90f2f208323298bc1ff8b708617526aaf2e791236795aa215d01e37f0f9"},"schema_version":"1.0"},"canonical_sha256":"805e7160591a305c74609ca434f5c1af798ac5e6f748cfff4aa2730ad97837f7","source":{"kind":"arxiv","id":"1609.06783","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1609.06783","created_at":"2026-05-18T01:04:05Z"},{"alias_kind":"arxiv_version","alias_value":"1609.06783v1","created_at":"2026-05-18T01:04:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1609.06783","created_at":"2026-05-18T01:04:05Z"},{"alias_kind":"pith_short_12","alias_value":"QBPHCYCZDIYF","created_at":"2026-05-18T12:30:39Z"},{"alias_kind":"pith_short_16","alias_value":"QBPHCYCZDIYFY5DA","created_at":"2026-05-18T12:30:39Z"},{"alias_kind":"pith_short_8","alias_value":"QBPHCYCZ","created_at":"2026-05-18T12:30:39Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:QBPHCYCZDIYFY5DATSSDJ5OBV5","target":"record","payload":{"canonical_record":{"source":{"id":"1609.06783","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-09-22T00:10:16Z","cross_cats_sorted":["cs.CL","cs.LG"],"title_canon_sha256":"a7e84d4cd485b3c782a361288ff61b097bacfe44bc3f0cacceeb1fba61a0bb5d","abstract_canon_sha256":"7258b90f2f208323298bc1ff8b708617526aaf2e791236795aa215d01e37f0f9"},"schema_version":"1.0"},"canonical_sha256":"805e7160591a305c74609ca434f5c1af798ac5e6f748cfff4aa2730ad97837f7","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:04:05.105825Z","signature_b64":"0eU0ESTYLuytQ98iPtk97uDwuwsuDR6m2MeUF9uBvgo40h6Jq+0wa0PSA+zfMFTqzn9RlZD/ydJUXGlI3innDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"805e7160591a305c74609ca434f5c1af798ac5e6f748cfff4aa2730ad97837f7","last_reissued_at":"2026-05-18T01:04:05.105270Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:04:05.105270Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1609.06783","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:04:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"e4wC81Wv0/WOfuH6/a2EHyW9smz+9XG8H4XvFotL5AnfYTsuhpPC5KTcT1NhX0sCQlC2GFvXLvAtNMWpj17yCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T04:41:29.951556Z"},"content_sha256":"76a47849ced9cc7eb5c3cdec84dfafba8718af12fe2bd653c5df4ffcbac67c25","schema_version":"1.0","event_id":"sha256:76a47849ced9cc7eb5c3cdec84dfafba8718af12fe2bd653c5df4ffcbac67c25"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:QBPHCYCZDIYFY5DATSSDJ5OBV5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Nonparametric Bayesian Topic Modelling with the Hierarchical Pitman-Yor Processes","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.LG"],"primary_cat":"stat.ML","authors_text":"Changyou Chen, Kar Wai Lim, Lan Du, Wray Buntine","submitted_at":"2016-09-22T00:10:16Z","abstract_excerpt":"The Dirichlet process and its extension, the Pitman-Yor process, are stochastic processes that take probability distributions as a parameter. These processes can be stacked up to form a hierarchical nonparametric Bayesian model. In this article, we present efficient methods for the use of these processes in this hierarchical context, and apply them to latent variable models for text analytics. In particular, we propose a general framework for designing these Bayesian models, which are called topic models in the computer science community. We then propose a specific nonparametric Bayesian topic"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1609.06783","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:04:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"xCy5xbBbFA7kbg2aoTYEjGQXMApWZYsq6HzzXvxj9f4Jt4bI9zzMKs+qkfai4SegWi1eFcdyRaMMirOUbUuHCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T04:41:29.952243Z"},"content_sha256":"24839923aa3a40d467238a0bef356b0c7278736211e53eb7fabc2d71283a6775","schema_version":"1.0","event_id":"sha256:24839923aa3a40d467238a0bef356b0c7278736211e53eb7fabc2d71283a6775"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/QBPHCYCZDIYFY5DATSSDJ5OBV5/bundle.json","state_url":"https://pith.science/pith/QBPHCYCZDIYFY5DATSSDJ5OBV5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/QBPHCYCZDIYFY5DATSSDJ5OBV5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T04:41:29Z","links":{"resolver":"https://pith.science/pith/QBPHCYCZDIYFY5DATSSDJ5OBV5","bundle":"https://pith.science/pith/QBPHCYCZDIYFY5DATSSDJ5OBV5/bundle.json","state":"https://pith.science/pith/QBPHCYCZDIYFY5DATSSDJ5OBV5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/QBPHCYCZDIYFY5DATSSDJ5OBV5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:QBPHCYCZDIYFY5DATSSDJ5OBV5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7258b90f2f208323298bc1ff8b708617526aaf2e791236795aa215d01e37f0f9","cross_cats_sorted":["cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-09-22T00:10:16Z","title_canon_sha256":"a7e84d4cd485b3c782a361288ff61b097bacfe44bc3f0cacceeb1fba61a0bb5d"},"schema_version":"1.0","source":{"id":"1609.06783","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1609.06783","created_at":"2026-05-18T01:04:05Z"},{"alias_kind":"arxiv_version","alias_value":"1609.06783v1","created_at":"2026-05-18T01:04:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1609.06783","created_at":"2026-05-18T01:04:05Z"},{"alias_kind":"pith_short_12","alias_value":"QBPHCYCZDIYF","created_at":"2026-05-18T12:30:39Z"},{"alias_kind":"pith_short_16","alias_value":"QBPHCYCZDIYFY5DA","created_at":"2026-05-18T12:30:39Z"},{"alias_kind":"pith_short_8","alias_value":"QBPHCYCZ","created_at":"2026-05-18T12:30:39Z"}],"graph_snapshots":[{"event_id":"sha256:24839923aa3a40d467238a0bef356b0c7278736211e53eb7fabc2d71283a6775","target":"graph","created_at":"2026-05-18T01:04:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The Dirichlet process and its extension, the Pitman-Yor process, are stochastic processes that take probability distributions as a parameter. These processes can be stacked up to form a hierarchical nonparametric Bayesian model. In this article, we present efficient methods for the use of these processes in this hierarchical context, and apply them to latent variable models for text analytics. In particular, we propose a general framework for designing these Bayesian models, which are called topic models in the computer science community. We then propose a specific nonparametric Bayesian topic","authors_text":"Changyou Chen, Kar Wai Lim, Lan Du, Wray Buntine","cross_cats":["cs.CL","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-09-22T00:10:16Z","title":"Nonparametric Bayesian Topic Modelling with the Hierarchical Pitman-Yor Processes"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1609.06783","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:76a47849ced9cc7eb5c3cdec84dfafba8718af12fe2bd653c5df4ffcbac67c25","target":"record","created_at":"2026-05-18T01:04:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7258b90f2f208323298bc1ff8b708617526aaf2e791236795aa215d01e37f0f9","cross_cats_sorted":["cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-09-22T00:10:16Z","title_canon_sha256":"a7e84d4cd485b3c782a361288ff61b097bacfe44bc3f0cacceeb1fba61a0bb5d"},"schema_version":"1.0","source":{"id":"1609.06783","kind":"arxiv","version":1}},"canonical_sha256":"805e7160591a305c74609ca434f5c1af798ac5e6f748cfff4aa2730ad97837f7","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"805e7160591a305c74609ca434f5c1af798ac5e6f748cfff4aa2730ad97837f7","first_computed_at":"2026-05-18T01:04:05.105270Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:04:05.105270Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"0eU0ESTYLuytQ98iPtk97uDwuwsuDR6m2MeUF9uBvgo40h6Jq+0wa0PSA+zfMFTqzn9RlZD/ydJUXGlI3innDg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:04:05.105825Z","signed_message":"canonical_sha256_bytes"},"source_id":"1609.06783","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:76a47849ced9cc7eb5c3cdec84dfafba8718af12fe2bd653c5df4ffcbac67c25","sha256:24839923aa3a40d467238a0bef356b0c7278736211e53eb7fabc2d71283a6775"],"state_sha256":"e363b23913400d052ac9b4cdc4e6cdad89aa238bde84254c8d4a8a33c47a6d98"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VymHT4GgYBdHUe2T0OqDdDKOu6Ojf7MDMg7Qb7NauBYVJpjNeviH0/1gE9IGvmV5MdSKU3aO5Bc57PqBowXPBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T04:41:29.956216Z","bundle_sha256":"00d63f09c12cf6e5a46b3b06b67e0f68c8fee96cebc842bebff99cad81c659a0"}}