{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2012:NOOUX2Y72UCGPAV7YKLGJKCSKL","short_pith_number":"pith:NOOUX2Y7","canonical_record":{"source":{"id":"1204.6703","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2012-04-30T17:06:06Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"4db286cb10a698bedf04d4c1611434098056fb1e5e75f90ea55a0ae24e16512b","abstract_canon_sha256":"37030cf91a3ccc39cb661ed8fe49d02da82542e01a67ca603374b45bf092aa13"},"schema_version":"1.0"},"canonical_sha256":"6b9d4beb1fd5046782bfc29664a85252dd7dc1fc52ab3b9bd2bb026af3c250b7","source":{"kind":"arxiv","id":"1204.6703","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1204.6703","created_at":"2026-05-18T03:36:06Z"},{"alias_kind":"arxiv_version","alias_value":"1204.6703v4","created_at":"2026-05-18T03:36:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1204.6703","created_at":"2026-05-18T03:36:06Z"},{"alias_kind":"pith_short_12","alias_value":"NOOUX2Y72UCG","created_at":"2026-05-18T12:27:16Z"},{"alias_kind":"pith_short_16","alias_value":"NOOUX2Y72UCGPAV7","created_at":"2026-05-18T12:27:16Z"},{"alias_kind":"pith_short_8","alias_value":"NOOUX2Y7","created_at":"2026-05-18T12:27:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2012:NOOUX2Y72UCGPAV7YKLGJKCSKL","target":"record","payload":{"canonical_record":{"source":{"id":"1204.6703","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2012-04-30T17:06:06Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"4db286cb10a698bedf04d4c1611434098056fb1e5e75f90ea55a0ae24e16512b","abstract_canon_sha256":"37030cf91a3ccc39cb661ed8fe49d02da82542e01a67ca603374b45bf092aa13"},"schema_version":"1.0"},"canonical_sha256":"6b9d4beb1fd5046782bfc29664a85252dd7dc1fc52ab3b9bd2bb026af3c250b7","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T03:36:06.449775Z","signature_b64":"rxAcHyOioZgFVuKNNrx8TWIlCPBI0eXKACSsFWuwkRgrtlQWAopa91qEk0sKItX/iacwvF7lSZPF5gzGHkRYAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6b9d4beb1fd5046782bfc29664a85252dd7dc1fc52ab3b9bd2bb026af3c250b7","last_reissued_at":"2026-05-18T03:36:06.449026Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T03:36:06.449026Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1204.6703","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T03:36:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"4TBRe5qzM0DO6/aniwqmBiTFmsbZ16+hkZtrdZsEQ1LLBLbFTtvqISv1NsH7Erx/3wegbDi2LQetZAyPrdV9Bg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:42:12.160823Z"},"content_sha256":"869e221561d81bb239678d2c1ff4261bf13a056f908909db03118765bd91aab2","schema_version":"1.0","event_id":"sha256:869e221561d81bb239678d2c1ff4261bf13a056f908909db03118765bd91aab2"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2012:NOOUX2Y72UCGPAV7YKLGJKCSKL","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Spectral Algorithm for Latent Dirichlet Allocation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Animashree Anandkumar, Daniel Hsu, Dean P. Foster, Sham M. Kakade, Yi-Kai Liu","submitted_at":"2012-04-30T17:06:06Z","abstract_excerpt":"The problem of topic modeling can be seen as a generalization of the clustering problem, in that it posits that observations are generated due to multiple latent factors (e.g., the words in each document are generated as a mixture of several active topics, as opposed to just one). This increased representational power comes at the cost of a more challenging unsupervised learning problem of estimating the topic probability vectors (the distributions over words for each topic), when only the words are observed and the corresponding topics are hidden.\n  We provide a simple and efficient learning "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1204.6703","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T03:36:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vI/rNhwfWhy+s6dnSQg1uyUaeDgafCvbQU6RNJye16q7TigStHY7oy+YPfmsu8szK1gOzMLdU85kdOrOXR4nDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:42:12.161242Z"},"content_sha256":"f0818c842830368de5c5c9b7881d9202cd930b0baefdf55d8133e9a4d67da9fd","schema_version":"1.0","event_id":"sha256:f0818c842830368de5c5c9b7881d9202cd930b0baefdf55d8133e9a4d67da9fd"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NOOUX2Y72UCGPAV7YKLGJKCSKL/bundle.json","state_url":"https://pith.science/pith/NOOUX2Y72UCGPAV7YKLGJKCSKL/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NOOUX2Y72UCGPAV7YKLGJKCSKL/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T12:42:12Z","links":{"resolver":"https://pith.science/pith/NOOUX2Y72UCGPAV7YKLGJKCSKL","bundle":"https://pith.science/pith/NOOUX2Y72UCGPAV7YKLGJKCSKL/bundle.json","state":"https://pith.science/pith/NOOUX2Y72UCGPAV7YKLGJKCSKL/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NOOUX2Y72UCGPAV7YKLGJKCSKL/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2012:NOOUX2Y72UCGPAV7YKLGJKCSKL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"37030cf91a3ccc39cb661ed8fe49d02da82542e01a67ca603374b45bf092aa13","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2012-04-30T17:06:06Z","title_canon_sha256":"4db286cb10a698bedf04d4c1611434098056fb1e5e75f90ea55a0ae24e16512b"},"schema_version":"1.0","source":{"id":"1204.6703","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1204.6703","created_at":"2026-05-18T03:36:06Z"},{"alias_kind":"arxiv_version","alias_value":"1204.6703v4","created_at":"2026-05-18T03:36:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1204.6703","created_at":"2026-05-18T03:36:06Z"},{"alias_kind":"pith_short_12","alias_value":"NOOUX2Y72UCG","created_at":"2026-05-18T12:27:16Z"},{"alias_kind":"pith_short_16","alias_value":"NOOUX2Y72UCGPAV7","created_at":"2026-05-18T12:27:16Z"},{"alias_kind":"pith_short_8","alias_value":"NOOUX2Y7","created_at":"2026-05-18T12:27:16Z"}],"graph_snapshots":[{"event_id":"sha256:f0818c842830368de5c5c9b7881d9202cd930b0baefdf55d8133e9a4d67da9fd","target":"graph","created_at":"2026-05-18T03:36:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The problem of topic modeling can be seen as a generalization of the clustering problem, in that it posits that observations are generated due to multiple latent factors (e.g., the words in each document are generated as a mixture of several active topics, as opposed to just one). This increased representational power comes at the cost of a more challenging unsupervised learning problem of estimating the topic probability vectors (the distributions over words for each topic), when only the words are observed and the corresponding topics are hidden.\n  We provide a simple and efficient learning ","authors_text":"Animashree Anandkumar, Daniel Hsu, Dean P. Foster, Sham M. Kakade, Yi-Kai Liu","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2012-04-30T17:06:06Z","title":"A Spectral Algorithm for Latent Dirichlet Allocation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1204.6703","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:869e221561d81bb239678d2c1ff4261bf13a056f908909db03118765bd91aab2","target":"record","created_at":"2026-05-18T03:36:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"37030cf91a3ccc39cb661ed8fe49d02da82542e01a67ca603374b45bf092aa13","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2012-04-30T17:06:06Z","title_canon_sha256":"4db286cb10a698bedf04d4c1611434098056fb1e5e75f90ea55a0ae24e16512b"},"schema_version":"1.0","source":{"id":"1204.6703","kind":"arxiv","version":4}},"canonical_sha256":"6b9d4beb1fd5046782bfc29664a85252dd7dc1fc52ab3b9bd2bb026af3c250b7","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6b9d4beb1fd5046782bfc29664a85252dd7dc1fc52ab3b9bd2bb026af3c250b7","first_computed_at":"2026-05-18T03:36:06.449026Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T03:36:06.449026Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"rxAcHyOioZgFVuKNNrx8TWIlCPBI0eXKACSsFWuwkRgrtlQWAopa91qEk0sKItX/iacwvF7lSZPF5gzGHkRYAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T03:36:06.449775Z","signed_message":"canonical_sha256_bytes"},"source_id":"1204.6703","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:869e221561d81bb239678d2c1ff4261bf13a056f908909db03118765bd91aab2","sha256:f0818c842830368de5c5c9b7881d9202cd930b0baefdf55d8133e9a4d67da9fd"],"state_sha256":"1bfcb014114f1becf62fe741d4491d75a95d15c0b61aa80a41bd0a7cf2272042"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"STl/Mho01mhDZx1IdNEHphSEBN211uRbYsUvVj+4/54Rdc8w2eIaOKwqmG0hGViIJe/5dcr3Hl11YAjz/19BAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T12:42:12.163898Z","bundle_sha256":"e8d9e8a5a704da071ad7b25cb6269c358940d25a09b64913f46743608e27893d"}}