{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2014:C4TI3TLFMZF7AEHVAXSJOY5KIN","short_pith_number":"pith:C4TI3TLF","canonical_record":{"source":{"id":"1401.6571","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-01-25T19:05:45Z","cross_cats_sorted":["cs.IR"],"title_canon_sha256":"e83d1bc21c1a24406d5dd68278fd6f5d424eb43af25d51ffd316990437582922","abstract_canon_sha256":"0d7dc7f6330fae92fe9e7667ed5c3b8fc59c2ee30d9dd283786f8accade81e6f"},"schema_version":"1.0"},"canonical_sha256":"17268dcd65664bf010f505e49763aa436ebaf7f59ed635e5e76a7ae0082b8379","source":{"kind":"arxiv","id":"1401.6571","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1401.6571","created_at":"2026-05-18T03:01:01Z"},{"alias_kind":"arxiv_version","alias_value":"1401.6571v1","created_at":"2026-05-18T03:01:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1401.6571","created_at":"2026-05-18T03:01:01Z"},{"alias_kind":"pith_short_12","alias_value":"C4TI3TLFMZF7","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_16","alias_value":"C4TI3TLFMZF7AEHV","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_8","alias_value":"C4TI3TLF","created_at":"2026-05-18T12:28:22Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2014:C4TI3TLFMZF7AEHVAXSJOY5KIN","target":"record","payload":{"canonical_record":{"source":{"id":"1401.6571","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-01-25T19:05:45Z","cross_cats_sorted":["cs.IR"],"title_canon_sha256":"e83d1bc21c1a24406d5dd68278fd6f5d424eb43af25d51ffd316990437582922","abstract_canon_sha256":"0d7dc7f6330fae92fe9e7667ed5c3b8fc59c2ee30d9dd283786f8accade81e6f"},"schema_version":"1.0"},"canonical_sha256":"17268dcd65664bf010f505e49763aa436ebaf7f59ed635e5e76a7ae0082b8379","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T03:01:01.310822Z","signature_b64":"QckRuF9KGWFLsuIMVU2O/FO+2qFz+rgt3GQ+s3ZyZPCrOslMsLaTSl2itOkbwAnoBhmmy8tpjifZ/CmQaxB2Cg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"17268dcd65664bf010f505e49763aa436ebaf7f59ed635e5e76a7ae0082b8379","last_reissued_at":"2026-05-18T03:01:01.310287Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T03:01:01.310287Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1401.6571","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T03:01:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UW2v1vg6nk6wccJEq24mXk9yeqRbfG4t0SSHhdPS4v5K4GRrI0bdHJRFwYZFVnMlztO24ejdjYOSYdA90dwJBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T19:48:28.413463Z"},"content_sha256":"ffa2dfb61b052226a69c5a8aa6183c23479876d6525db7f732816a9cbabc3358","schema_version":"1.0","event_id":"sha256:ffa2dfb61b052226a69c5a8aa6183c23479876d6525db7f732816a9cbabc3358"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2014:C4TI3TLFMZF7AEHVAXSJOY5KIN","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Keyword and Keyphrase Extraction Using Centrality Measures on Collocation Networks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Cornelia Caragea, Sagnik Ray Choudhury, Shibamouli Lahiri","submitted_at":"2014-01-25T19:05:45Z","abstract_excerpt":"Keyword and keyphrase extraction is an important problem in natural language processing, with applications ranging from summarization to semantic search to document clustering. Graph-based approaches to keyword and keyphrase extraction avoid the problem of acquiring a large in-domain training corpus by applying variants of PageRank algorithm on a network of words. Although graph-based approaches are knowledge-lean and easily adoptable in online systems, it remains largely open whether they can benefit from centrality measures other than PageRank. In this paper, we experiment with an array of c"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1401.6571","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T03:01:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"iwLkzeWDjbdXl880jxYwH3PRo9D0l1flXtvLWzMwKxurllWUibQQyeE8ThTsGT/4Bk7JmtaHiJe56QxqBmhjAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T19:48:28.414174Z"},"content_sha256":"f0736696b17652de64cabe9c34f7d64e6e03668f250b6ce23515b52bf5ca2531","schema_version":"1.0","event_id":"sha256:f0736696b17652de64cabe9c34f7d64e6e03668f250b6ce23515b52bf5ca2531"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/bundle.json","state_url":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T19:48:28Z","links":{"resolver":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN","bundle":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/bundle.json","state":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/state.json","well_known_bundle":"https://pith.science/.well-known/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:C4TI3TLFMZF7AEHVAXSJOY5KIN","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0d7dc7f6330fae92fe9e7667ed5c3b8fc59c2ee30d9dd283786f8accade81e6f","cross_cats_sorted":["cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-01-25T19:05:45Z","title_canon_sha256":"e83d1bc21c1a24406d5dd68278fd6f5d424eb43af25d51ffd316990437582922"},"schema_version":"1.0","source":{"id":"1401.6571","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1401.6571","created_at":"2026-05-18T03:01:01Z"},{"alias_kind":"arxiv_version","alias_value":"1401.6571v1","created_at":"2026-05-18T03:01:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1401.6571","created_at":"2026-05-18T03:01:01Z"},{"alias_kind":"pith_short_12","alias_value":"C4TI3TLFMZF7","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_16","alias_value":"C4TI3TLFMZF7AEHV","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_8","alias_value":"C4TI3TLF","created_at":"2026-05-18T12:28:22Z"}],"graph_snapshots":[{"event_id":"sha256:f0736696b17652de64cabe9c34f7d64e6e03668f250b6ce23515b52bf5ca2531","target":"graph","created_at":"2026-05-18T03:01:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Keyword and keyphrase extraction is an important problem in natural language processing, with applications ranging from summarization to semantic search to document clustering. Graph-based approaches to keyword and keyphrase extraction avoid the problem of acquiring a large in-domain training corpus by applying variants of PageRank algorithm on a network of words. Although graph-based approaches are knowledge-lean and easily adoptable in online systems, it remains largely open whether they can benefit from centrality measures other than PageRank. In this paper, we experiment with an array of c","authors_text":"Cornelia Caragea, Sagnik Ray Choudhury, Shibamouli Lahiri","cross_cats":["cs.IR"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-01-25T19:05:45Z","title":"Keyword and Keyphrase Extraction Using Centrality Measures on Collocation Networks"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1401.6571","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ffa2dfb61b052226a69c5a8aa6183c23479876d6525db7f732816a9cbabc3358","target":"record","created_at":"2026-05-18T03:01:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0d7dc7f6330fae92fe9e7667ed5c3b8fc59c2ee30d9dd283786f8accade81e6f","cross_cats_sorted":["cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-01-25T19:05:45Z","title_canon_sha256":"e83d1bc21c1a24406d5dd68278fd6f5d424eb43af25d51ffd316990437582922"},"schema_version":"1.0","source":{"id":"1401.6571","kind":"arxiv","version":1}},"canonical_sha256":"17268dcd65664bf010f505e49763aa436ebaf7f59ed635e5e76a7ae0082b8379","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"17268dcd65664bf010f505e49763aa436ebaf7f59ed635e5e76a7ae0082b8379","first_computed_at":"2026-05-18T03:01:01.310287Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T03:01:01.310287Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"QckRuF9KGWFLsuIMVU2O/FO+2qFz+rgt3GQ+s3ZyZPCrOslMsLaTSl2itOkbwAnoBhmmy8tpjifZ/CmQaxB2Cg==","signature_status":"signed_v1","signed_at":"2026-05-18T03:01:01.310822Z","signed_message":"canonical_sha256_bytes"},"source_id":"1401.6571","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ffa2dfb61b052226a69c5a8aa6183c23479876d6525db7f732816a9cbabc3358","sha256:f0736696b17652de64cabe9c34f7d64e6e03668f250b6ce23515b52bf5ca2531"],"state_sha256":"17e87651ca302ea1b0af9244d061077d2ce05bd2d0453856769fc855f426a5f0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YdQywy/3VEfwRqBsmunwPIaG9RMzTFeFot1Fe6N3Q2DeCyeY/hwhxDyP3AiZb77ZFDEitelgpC7R4aZKiESQDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T19:48:28.418788Z","bundle_sha256":"dc11a83e56576d9228b4690f3f6461d7369e5efcd4998b32261eba55dbea11bc"}}