{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:DKXN5H6B4YLB3DP7KL34RPITJZ","short_pith_number":"pith:DKXN5H6B","canonical_record":{"source":{"id":"1604.08897","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-29T16:05:49Z","cross_cats_sorted":["cs.DL"],"title_canon_sha256":"45b2edc9942373842a671a2225984bd816fb2ae9a86404ffcde1a011ed0e86fd","abstract_canon_sha256":"e79184cad917e5bf3451109c3ee20464238a02c8d38383ac2728cc3c59c91d41"},"schema_version":"1.0"},"canonical_sha256":"1aaede9fc1e6161d8dff52f7c8bd134e6d6551f96e677fd75c5e0becbba7e4f1","source":{"kind":"arxiv","id":"1604.08897","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.08897","created_at":"2026-05-18T01:13:47Z"},{"alias_kind":"arxiv_version","alias_value":"1604.08897v2","created_at":"2026-05-18T01:13:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.08897","created_at":"2026-05-18T01:13:47Z"},{"alias_kind":"pith_short_12","alias_value":"DKXN5H6B4YLB","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_16","alias_value":"DKXN5H6B4YLB3DP7","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_8","alias_value":"DKXN5H6B","created_at":"2026-05-18T12:30:12Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:DKXN5H6B4YLB3DP7KL34RPITJZ","target":"record","payload":{"canonical_record":{"source":{"id":"1604.08897","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-29T16:05:49Z","cross_cats_sorted":["cs.DL"],"title_canon_sha256":"45b2edc9942373842a671a2225984bd816fb2ae9a86404ffcde1a011ed0e86fd","abstract_canon_sha256":"e79184cad917e5bf3451109c3ee20464238a02c8d38383ac2728cc3c59c91d41"},"schema_version":"1.0"},"canonical_sha256":"1aaede9fc1e6161d8dff52f7c8bd134e6d6551f96e677fd75c5e0becbba7e4f1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:13:47.319061Z","signature_b64":"XI3UFsWvJ11FLTwQBBsJIFY8TYlggVGfeipf3j0mvzO+nErSAF/CSUdptlC5pnJR9Jlv4/MQfhbsyMNTHV/cBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1aaede9fc1e6161d8dff52f7c8bd134e6d6551f96e677fd75c5e0becbba7e4f1","last_reissued_at":"2026-05-18T01:13:47.318450Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:13:47.318450Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1604.08897","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:13:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"wj+7m3UoXNLCgGe3gMbQ/ITkaAeZZLIyuNy4ot216ngWmDcO+zPEZrF+P7kJjLZZZqoEFQyuLCHtsnkPEJWBBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T22:38:35.623420Z"},"content_sha256":"0aa4987c9e17ed2985918f0a0f6ecae4a5c33268d904b53ba9f4078c7f86eb9a","schema_version":"1.0","event_id":"sha256:0aa4987c9e17ed2985918f0a0f6ecae4a5c33268d904b53ba9f4078c7f86eb9a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:DKXN5H6B4YLB3DP7KL34RPITJZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Universal Indexes for Highly Repetitive Document Collections","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DL"],"primary_cat":"cs.IR","authors_text":"Antonio Fari\\~na, Francisco Claude, Gonzalo Navarro, Miguel A. Mart\\'inez-Prieto","submitted_at":"2016-04-29T16:05:49Z","abstract_excerpt":"Indexing highly repetitive collections has become a relevant problem with the emergence of large repositories of versioned documents, among other applications. These collections may reach huge sizes, but are formed mostly of documents that are near-copies of others. Traditional techniques for indexing these collections fail to properly exploit their regularities in order to reduce space.\n  We introduce new techniques for compressing inverted indexes that exploit this near-copy regularity. They are based on run-length, Lempel-Ziv, or grammar compression of the differential inverted lists, inste"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.08897","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:13:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"O8KdCeU476gC01xfKwoqf/NSyhMeNFXeX0OLu1c5i8ZT2OIwLJALGtW3wYDAsfZ1o1LBxkLVjsIftqsFC/XeAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T22:38:35.624174Z"},"content_sha256":"a9ff92c0f5212d98fe105fcdae823bacf0b57beefcd45ea9e0fcb160352ba281","schema_version":"1.0","event_id":"sha256:a9ff92c0f5212d98fe105fcdae823bacf0b57beefcd45ea9e0fcb160352ba281"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/DKXN5H6B4YLB3DP7KL34RPITJZ/bundle.json","state_url":"https://pith.science/pith/DKXN5H6B4YLB3DP7KL34RPITJZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/DKXN5H6B4YLB3DP7KL34RPITJZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T22:38:35Z","links":{"resolver":"https://pith.science/pith/DKXN5H6B4YLB3DP7KL34RPITJZ","bundle":"https://pith.science/pith/DKXN5H6B4YLB3DP7KL34RPITJZ/bundle.json","state":"https://pith.science/pith/DKXN5H6B4YLB3DP7KL34RPITJZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/DKXN5H6B4YLB3DP7KL34RPITJZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:DKXN5H6B4YLB3DP7KL34RPITJZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e79184cad917e5bf3451109c3ee20464238a02c8d38383ac2728cc3c59c91d41","cross_cats_sorted":["cs.DL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-29T16:05:49Z","title_canon_sha256":"45b2edc9942373842a671a2225984bd816fb2ae9a86404ffcde1a011ed0e86fd"},"schema_version":"1.0","source":{"id":"1604.08897","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.08897","created_at":"2026-05-18T01:13:47Z"},{"alias_kind":"arxiv_version","alias_value":"1604.08897v2","created_at":"2026-05-18T01:13:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.08897","created_at":"2026-05-18T01:13:47Z"},{"alias_kind":"pith_short_12","alias_value":"DKXN5H6B4YLB","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_16","alias_value":"DKXN5H6B4YLB3DP7","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_8","alias_value":"DKXN5H6B","created_at":"2026-05-18T12:30:12Z"}],"graph_snapshots":[{"event_id":"sha256:a9ff92c0f5212d98fe105fcdae823bacf0b57beefcd45ea9e0fcb160352ba281","target":"graph","created_at":"2026-05-18T01:13:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Indexing highly repetitive collections has become a relevant problem with the emergence of large repositories of versioned documents, among other applications. These collections may reach huge sizes, but are formed mostly of documents that are near-copies of others. Traditional techniques for indexing these collections fail to properly exploit their regularities in order to reduce space.\n  We introduce new techniques for compressing inverted indexes that exploit this near-copy regularity. They are based on run-length, Lempel-Ziv, or grammar compression of the differential inverted lists, inste","authors_text":"Antonio Fari\\~na, Francisco Claude, Gonzalo Navarro, Miguel A. Mart\\'inez-Prieto","cross_cats":["cs.DL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-29T16:05:49Z","title":"Universal Indexes for Highly Repetitive Document Collections"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.08897","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0aa4987c9e17ed2985918f0a0f6ecae4a5c33268d904b53ba9f4078c7f86eb9a","target":"record","created_at":"2026-05-18T01:13:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e79184cad917e5bf3451109c3ee20464238a02c8d38383ac2728cc3c59c91d41","cross_cats_sorted":["cs.DL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-29T16:05:49Z","title_canon_sha256":"45b2edc9942373842a671a2225984bd816fb2ae9a86404ffcde1a011ed0e86fd"},"schema_version":"1.0","source":{"id":"1604.08897","kind":"arxiv","version":2}},"canonical_sha256":"1aaede9fc1e6161d8dff52f7c8bd134e6d6551f96e677fd75c5e0becbba7e4f1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1aaede9fc1e6161d8dff52f7c8bd134e6d6551f96e677fd75c5e0becbba7e4f1","first_computed_at":"2026-05-18T01:13:47.318450Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:13:47.318450Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"XI3UFsWvJ11FLTwQBBsJIFY8TYlggVGfeipf3j0mvzO+nErSAF/CSUdptlC5pnJR9Jlv4/MQfhbsyMNTHV/cBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T01:13:47.319061Z","signed_message":"canonical_sha256_bytes"},"source_id":"1604.08897","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0aa4987c9e17ed2985918f0a0f6ecae4a5c33268d904b53ba9f4078c7f86eb9a","sha256:a9ff92c0f5212d98fe105fcdae823bacf0b57beefcd45ea9e0fcb160352ba281"],"state_sha256":"2d73a63d9ab17cb104dbc85081f603ded3f13cfaa146845a6633449dce2f906f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kG4vh4T40Aqr3v9QvaFdMLCbX6xWDRoYcAMh/qIfZpdei4sbEbMjQfNsbpM5JKUnljBW7GEaNJJ3ySM8TkULDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T22:38:35.627669Z","bundle_sha256":"df153a373cc18d6835b44bb44af7cd70ff0cf6a81cdb260abe849fee41f70269"}}