{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2012:NG4XAKHDS5QT7B3Q3L6SQO6FN3","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0ab03253bc45649d1ea5448cec429c1dbb12298590af78e6803a7fd13247551e","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-08-28T13:23:29Z","title_canon_sha256":"f5c123d3b4bccba0176059b2e9ae2c0b86015e3b5f00ec29bc404f174865a638"},"schema_version":"1.0","source":{"id":"1208.5654","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1208.5654","created_at":"2026-05-18T03:46:48Z"},{"alias_kind":"arxiv_version","alias_value":"1208.5654v2","created_at":"2026-05-18T03:46:48Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1208.5654","created_at":"2026-05-18T03:46:48Z"},{"alias_kind":"pith_short_12","alias_value":"NG4XAKHDS5QT","created_at":"2026-05-18T12:27:16Z"},{"alias_kind":"pith_short_16","alias_value":"NG4XAKHDS5QT7B3Q","created_at":"2026-05-18T12:27:16Z"},{"alias_kind":"pith_short_8","alias_value":"NG4XAKHD","created_at":"2026-05-18T12:27:16Z"}],"graph_snapshots":[{"event_id":"sha256:cb065527b49dd3f04e2c8a777d31e476be341e5965ab17201062f2ca3ef9eaf1","target":"graph","created_at":"2026-05-18T03:46:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Divergence from a random baseline is a technique for the evaluation of document clustering. It ensures cluster quality measures are performing work that prevents ineffective clusterings from giving high scores to clusterings that provide no useful result. These concepts are defined and analysed using intrinsic and extrinsic approaches to the evaluation of document cluster quality. This includes the classical clusters to categories approach and a novel approach that uses ad hoc information retrieval. The divergence from a random baseline approach is able to differentiate ineffective clusterings","authors_text":"Andrew Trotman, Christopher M. De Vries, Shlomo Geva","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-08-28T13:23:29Z","title":"Document Clustering Evaluation: Divergence from a Random Baseline"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1208.5654","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6d90eca830cf8d2ac401046d071d9336d57257491066f74d8735d553d44c2719","target":"record","created_at":"2026-05-18T03:46:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0ab03253bc45649d1ea5448cec429c1dbb12298590af78e6803a7fd13247551e","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-08-28T13:23:29Z","title_canon_sha256":"f5c123d3b4bccba0176059b2e9ae2c0b86015e3b5f00ec29bc404f174865a638"},"schema_version":"1.0","source":{"id":"1208.5654","kind":"arxiv","version":2}},"canonical_sha256":"69b97028e397613f8770dafd283bc56ec1649f561102ce8252d136a0cc6a49c3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"69b97028e397613f8770dafd283bc56ec1649f561102ce8252d136a0cc6a49c3","first_computed_at":"2026-05-18T03:46:48.755411Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T03:46:48.755411Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"QW6fbfBmlS05DBakKBaEDKZP0rPPcSiCswp813HBCG9Q+fNL5iOd808nuNK7N3OqvHAtmUhxq5YSeY4SO1ptDA==","signature_status":"signed_v1","signed_at":"2026-05-18T03:46:48.756249Z","signed_message":"canonical_sha256_bytes"},"source_id":"1208.5654","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6d90eca830cf8d2ac401046d071d9336d57257491066f74d8735d553d44c2719","sha256:cb065527b49dd3f04e2c8a777d31e476be341e5965ab17201062f2ca3ef9eaf1"],"state_sha256":"d3dac9af2302aa13c898903b2ffe636ecd2f932b1deafe8a274ac38c91acb730"}