{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:UIMMJSIDUEPESP4JNCWCYSWX2M","short_pith_number":"pith:UIMMJSID","canonical_record":{"source":{"id":"1905.12753","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DS","submitted_at":"2019-05-29T22:21:47Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"2be6d3b266f2525ce6b4df24c28bf4c0fc45f2168ea058178011888746c8bbcf","abstract_canon_sha256":"d7a071710dd60291e9ec76f0bcb764d31c52f34654b70e42357124c2cb066df7"},"schema_version":"1.0"},"canonical_sha256":"a218c4c903a11e493f8968ac2c4ad7d30d9fb6893cd1aedcf71b4874ba48e6b2","source":{"kind":"arxiv","id":"1905.12753","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.12753","created_at":"2026-05-17T23:44:39Z"},{"alias_kind":"arxiv_version","alias_value":"1905.12753v1","created_at":"2026-05-17T23:44:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.12753","created_at":"2026-05-17T23:44:39Z"},{"alias_kind":"pith_short_12","alias_value":"UIMMJSIDUEPE","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"UIMMJSIDUEPESP4J","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"UIMMJSID","created_at":"2026-05-18T12:33:30Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:UIMMJSIDUEPESP4JNCWCYSWX2M","target":"record","payload":{"canonical_record":{"source":{"id":"1905.12753","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DS","submitted_at":"2019-05-29T22:21:47Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"2be6d3b266f2525ce6b4df24c28bf4c0fc45f2168ea058178011888746c8bbcf","abstract_canon_sha256":"d7a071710dd60291e9ec76f0bcb764d31c52f34654b70e42357124c2cb066df7"},"schema_version":"1.0"},"canonical_sha256":"a218c4c903a11e493f8968ac2c4ad7d30d9fb6893cd1aedcf71b4874ba48e6b2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:44:39.737798Z","signature_b64":"Rx1i7hDdXO9oCCaVPo9GO4atnXJiGjgowTJTzcD+w1+eTRdjYL0R7Di0uzxm/euB6huaNNCsRnB55OtQshJECQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a218c4c903a11e493f8968ac2c4ad7d30d9fb6893cd1aedcf71b4874ba48e6b2","last_reissued_at":"2026-05-17T23:44:39.737332Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:44:39.737332Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1905.12753","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6iMrgKkJAaEFZjNKp77HSbphyB6L5tcFyWPpnEn0H4laOYXF681HajBBrSkx8j2gwDdc4L8mktxEguleTAP1DA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T23:04:52.439004Z"},"content_sha256":"10af9a070267b5b64c772606a11dcd5675045e23eb483d2437ac1999af7c6e77","schema_version":"1.0","event_id":"sha256:10af9a070267b5b64c772606a11dcd5675045e23eb483d2437ac1999af7c6e77"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:UIMMJSIDUEPESP4JNCWCYSWX2M","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Clustering without Over-Representation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.DS","authors_text":"Alessandro Epasto, Mohammad Mahdian, Ravi Kumar, Sara Ahmadian","submitted_at":"2019-05-29T22:21:47Z","abstract_excerpt":"In this paper we consider clustering problems in which each point is endowed with a color. The goal is to cluster the points to minimize the classical clustering cost but with the additional constraint that no color is over-represented in any cluster. This problem is motivated by practical clustering settings, e.g., in clustering news articles where the color of an article is its source, it is preferable that no single news source dominates any cluster.\n  For the most general version of this problem, we obtain an algorithm that has provable guarantees of performance; our algorithm is based on "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.12753","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZOt9GrN1YtdSNsMkp7qaRVI863siN1KSZJnfL8X+8oVwyOPRIpA2KvzgNc/08LVxqEJWzlKiAUedf3ELf4ddDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T23:04:52.439738Z"},"content_sha256":"d3c3411eaac2ec11385d6884c7af493160b15ba38266040c177b2ef9e70f81b8","schema_version":"1.0","event_id":"sha256:d3c3411eaac2ec11385d6884c7af493160b15ba38266040c177b2ef9e70f81b8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/UIMMJSIDUEPESP4JNCWCYSWX2M/bundle.json","state_url":"https://pith.science/pith/UIMMJSIDUEPESP4JNCWCYSWX2M/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/UIMMJSIDUEPESP4JNCWCYSWX2M/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T23:04:52Z","links":{"resolver":"https://pith.science/pith/UIMMJSIDUEPESP4JNCWCYSWX2M","bundle":"https://pith.science/pith/UIMMJSIDUEPESP4JNCWCYSWX2M/bundle.json","state":"https://pith.science/pith/UIMMJSIDUEPESP4JNCWCYSWX2M/state.json","well_known_bundle":"https://pith.science/.well-known/pith/UIMMJSIDUEPESP4JNCWCYSWX2M/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:UIMMJSIDUEPESP4JNCWCYSWX2M","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d7a071710dd60291e9ec76f0bcb764d31c52f34654b70e42357124c2cb066df7","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DS","submitted_at":"2019-05-29T22:21:47Z","title_canon_sha256":"2be6d3b266f2525ce6b4df24c28bf4c0fc45f2168ea058178011888746c8bbcf"},"schema_version":"1.0","source":{"id":"1905.12753","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.12753","created_at":"2026-05-17T23:44:39Z"},{"alias_kind":"arxiv_version","alias_value":"1905.12753v1","created_at":"2026-05-17T23:44:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.12753","created_at":"2026-05-17T23:44:39Z"},{"alias_kind":"pith_short_12","alias_value":"UIMMJSIDUEPE","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"UIMMJSIDUEPESP4J","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"UIMMJSID","created_at":"2026-05-18T12:33:30Z"}],"graph_snapshots":[{"event_id":"sha256:d3c3411eaac2ec11385d6884c7af493160b15ba38266040c177b2ef9e70f81b8","target":"graph","created_at":"2026-05-17T23:44:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper we consider clustering problems in which each point is endowed with a color. The goal is to cluster the points to minimize the classical clustering cost but with the additional constraint that no color is over-represented in any cluster. This problem is motivated by practical clustering settings, e.g., in clustering news articles where the color of an article is its source, it is preferable that no single news source dominates any cluster.\n  For the most general version of this problem, we obtain an algorithm that has provable guarantees of performance; our algorithm is based on ","authors_text":"Alessandro Epasto, Mohammad Mahdian, Ravi Kumar, Sara Ahmadian","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DS","submitted_at":"2019-05-29T22:21:47Z","title":"Clustering without Over-Representation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.12753","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:10af9a070267b5b64c772606a11dcd5675045e23eb483d2437ac1999af7c6e77","target":"record","created_at":"2026-05-17T23:44:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d7a071710dd60291e9ec76f0bcb764d31c52f34654b70e42357124c2cb066df7","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DS","submitted_at":"2019-05-29T22:21:47Z","title_canon_sha256":"2be6d3b266f2525ce6b4df24c28bf4c0fc45f2168ea058178011888746c8bbcf"},"schema_version":"1.0","source":{"id":"1905.12753","kind":"arxiv","version":1}},"canonical_sha256":"a218c4c903a11e493f8968ac2c4ad7d30d9fb6893cd1aedcf71b4874ba48e6b2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a218c4c903a11e493f8968ac2c4ad7d30d9fb6893cd1aedcf71b4874ba48e6b2","first_computed_at":"2026-05-17T23:44:39.737332Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:44:39.737332Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Rx1i7hDdXO9oCCaVPo9GO4atnXJiGjgowTJTzcD+w1+eTRdjYL0R7Di0uzxm/euB6huaNNCsRnB55OtQshJECQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:44:39.737798Z","signed_message":"canonical_sha256_bytes"},"source_id":"1905.12753","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:10af9a070267b5b64c772606a11dcd5675045e23eb483d2437ac1999af7c6e77","sha256:d3c3411eaac2ec11385d6884c7af493160b15ba38266040c177b2ef9e70f81b8"],"state_sha256":"ca80432b5236fa77ea63dca8827bc340f3e191dd1ba5ef89ab3fbf5d8de189fc"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"88e3TvgczjG77N5qmHlz6fmF4AK92uOS4IMxP1o+xo2pvfocuxdbAmcO/emmajlbNRd4GAXfKHNz2jyUf65KDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T23:04:52.443760Z","bundle_sha256":"b4a434fb8ed0f9b0658dc175c0d8a94d655cc07aeddd47efdce656cc83632fc0"}}