{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2013:SEF7LI3EQASIUQUGIWXIHJLJIT","short_pith_number":"pith:SEF7LI3E","canonical_record":{"source":{"id":"1310.0509","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.LG","submitted_at":"2013-10-01T22:34:18Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"ce100191816afb4c365f47ca2d4104539ccf952fcafb841f1f4f3ad923f361c6","abstract_canon_sha256":"bb7a53d23d4bb44849723238dbea9ad85d1cef874620a1b70db1576248c9e7dd"},"schema_version":"1.0"},"canonical_sha256":"910bf5a36480248a428645ae83a56944f4bd17ec52ae8fdf99bd591eb17e0077","source":{"kind":"arxiv","id":"1310.0509","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1310.0509","created_at":"2026-05-18T03:06:21Z"},{"alias_kind":"arxiv_version","alias_value":"1310.0509v4","created_at":"2026-05-18T03:06:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1310.0509","created_at":"2026-05-18T03:06:21Z"},{"alias_kind":"pith_short_12","alias_value":"SEF7LI3EQASI","created_at":"2026-05-18T12:27:59Z"},{"alias_kind":"pith_short_16","alias_value":"SEF7LI3EQASIUQUG","created_at":"2026-05-18T12:27:59Z"},{"alias_kind":"pith_short_8","alias_value":"SEF7LI3E","created_at":"2026-05-18T12:27:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2013:SEF7LI3EQASIUQUGIWXIHJLJIT","target":"record","payload":{"canonical_record":{"source":{"id":"1310.0509","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.LG","submitted_at":"2013-10-01T22:34:18Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"ce100191816afb4c365f47ca2d4104539ccf952fcafb841f1f4f3ad923f361c6","abstract_canon_sha256":"bb7a53d23d4bb44849723238dbea9ad85d1cef874620a1b70db1576248c9e7dd"},"schema_version":"1.0"},"canonical_sha256":"910bf5a36480248a428645ae83a56944f4bd17ec52ae8fdf99bd591eb17e0077","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T03:06:21.584090Z","signature_b64":"0VAbnkHGH7Cp5mfpLD9dBb60VSzHlkzblxoNFYL+7Gj7blrQYb1TD4K9njASmmamY2YZqHjhDbJmARpp2fckBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"910bf5a36480248a428645ae83a56944f4bd17ec52ae8fdf99bd591eb17e0077","last_reissued_at":"2026-05-18T03:06:21.583481Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T03:06:21.583481Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1310.0509","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T03:06:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+WoAUbUAb0TJKEKOLyfe50g9rP+wjz6yWD5e0uo/sejc+lLNtznTRg3ODgVE2ZRTNvhPAzv0IdeVEd+RKz8PCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T18:30:24.526721Z"},"content_sha256":"abf17477efbdc32cfd342ec9bef6f7fe0a96fd55915d433ef0f9c4c95b3b8716","schema_version":"1.0","event_id":"sha256:abf17477efbdc32cfd342ec9bef6f7fe0a96fd55915d433ef0f9c4c95b3b8716"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2013:SEF7LI3EQASIUQUGIWXIHJLJIT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Summary Statistics for Partitionings and Feature Allocations","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Ali Taylan Cemgil, I\\c{s}{\\i}k Bar{\\i}\\c{s} Fidaner","submitted_at":"2013-10-01T22:34:18Z","abstract_excerpt":"Infinite mixture models are commonly used for clustering. One can sample from the posterior of mixture assignments by Monte Carlo methods or find its maximum a posteriori solution by optimization. However, in some problems the posterior is diffuse and it is hard to interpret the sampled partitionings. In this paper, we introduce novel statistics based on block sizes for representing sample sets of partitionings and feature allocations. We develop an element-based definition of entropy to quantify segmentation among their elements. Then we propose a simple algorithm called entropy agglomeration"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1310.0509","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T03:06:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ysroKybGFiUa821dz7SbbjSzPbuvFrzod4LSuhHrVemQnRRAtIhhoLi4qGo+k39gIVlz1IjNBkJd1r2a/Z8mBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T18:30:24.527064Z"},"content_sha256":"e048ff064576be4105f22ad2e70a8873b9bbf0867b80c43c5ea0ee118eae251b","schema_version":"1.0","event_id":"sha256:e048ff064576be4105f22ad2e70a8873b9bbf0867b80c43c5ea0ee118eae251b"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SEF7LI3EQASIUQUGIWXIHJLJIT/bundle.json","state_url":"https://pith.science/pith/SEF7LI3EQASIUQUGIWXIHJLJIT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SEF7LI3EQASIUQUGIWXIHJLJIT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T18:30:24Z","links":{"resolver":"https://pith.science/pith/SEF7LI3EQASIUQUGIWXIHJLJIT","bundle":"https://pith.science/pith/SEF7LI3EQASIUQUGIWXIHJLJIT/bundle.json","state":"https://pith.science/pith/SEF7LI3EQASIUQUGIWXIHJLJIT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SEF7LI3EQASIUQUGIWXIHJLJIT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2013:SEF7LI3EQASIUQUGIWXIHJLJIT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"bb7a53d23d4bb44849723238dbea9ad85d1cef874620a1b70db1576248c9e7dd","cross_cats_sorted":["stat.ML"],"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.LG","submitted_at":"2013-10-01T22:34:18Z","title_canon_sha256":"ce100191816afb4c365f47ca2d4104539ccf952fcafb841f1f4f3ad923f361c6"},"schema_version":"1.0","source":{"id":"1310.0509","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1310.0509","created_at":"2026-05-18T03:06:21Z"},{"alias_kind":"arxiv_version","alias_value":"1310.0509v4","created_at":"2026-05-18T03:06:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1310.0509","created_at":"2026-05-18T03:06:21Z"},{"alias_kind":"pith_short_12","alias_value":"SEF7LI3EQASI","created_at":"2026-05-18T12:27:59Z"},{"alias_kind":"pith_short_16","alias_value":"SEF7LI3EQASIUQUG","created_at":"2026-05-18T12:27:59Z"},{"alias_kind":"pith_short_8","alias_value":"SEF7LI3E","created_at":"2026-05-18T12:27:59Z"}],"graph_snapshots":[{"event_id":"sha256:e048ff064576be4105f22ad2e70a8873b9bbf0867b80c43c5ea0ee118eae251b","target":"graph","created_at":"2026-05-18T03:06:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Infinite mixture models are commonly used for clustering. One can sample from the posterior of mixture assignments by Monte Carlo methods or find its maximum a posteriori solution by optimization. However, in some problems the posterior is diffuse and it is hard to interpret the sampled partitionings. In this paper, we introduce novel statistics based on block sizes for representing sample sets of partitionings and feature allocations. We develop an element-based definition of entropy to quantify segmentation among their elements. Then we propose a simple algorithm called entropy agglomeration","authors_text":"Ali Taylan Cemgil, I\\c{s}{\\i}k Bar{\\i}\\c{s} Fidaner","cross_cats":["stat.ML"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.LG","submitted_at":"2013-10-01T22:34:18Z","title":"Summary Statistics for Partitionings and Feature Allocations"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1310.0509","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:abf17477efbdc32cfd342ec9bef6f7fe0a96fd55915d433ef0f9c4c95b3b8716","target":"record","created_at":"2026-05-18T03:06:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"bb7a53d23d4bb44849723238dbea9ad85d1cef874620a1b70db1576248c9e7dd","cross_cats_sorted":["stat.ML"],"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.LG","submitted_at":"2013-10-01T22:34:18Z","title_canon_sha256":"ce100191816afb4c365f47ca2d4104539ccf952fcafb841f1f4f3ad923f361c6"},"schema_version":"1.0","source":{"id":"1310.0509","kind":"arxiv","version":4}},"canonical_sha256":"910bf5a36480248a428645ae83a56944f4bd17ec52ae8fdf99bd591eb17e0077","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"910bf5a36480248a428645ae83a56944f4bd17ec52ae8fdf99bd591eb17e0077","first_computed_at":"2026-05-18T03:06:21.583481Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T03:06:21.583481Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"0VAbnkHGH7Cp5mfpLD9dBb60VSzHlkzblxoNFYL+7Gj7blrQYb1TD4K9njASmmamY2YZqHjhDbJmARpp2fckBw==","signature_status":"signed_v1","signed_at":"2026-05-18T03:06:21.584090Z","signed_message":"canonical_sha256_bytes"},"source_id":"1310.0509","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:abf17477efbdc32cfd342ec9bef6f7fe0a96fd55915d433ef0f9c4c95b3b8716","sha256:e048ff064576be4105f22ad2e70a8873b9bbf0867b80c43c5ea0ee118eae251b"],"state_sha256":"bcae3b78a4ff5d0b0907769e5a0ade6faf8cc41ce050938b243a7824e6fd2fb0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IUxe2+3jnjRrY7w4PmTny+oLqQ6zNEppXAHnAv00kXRB1bxOvcC+O8E9vWPVm+hc5PGFKX2QbitJPVboImoUDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T18:30:24.529097Z","bundle_sha256":"339e4b88ed7ec192a562df4a5266faf8982dd2dfa8a0302ad63443967840310f"}}