{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2014:C4TI3TLFMZF7AEHVAXSJOY5KIN","short_pith_number":"pith:C4TI3TLF","schema_version":"1.0","canonical_sha256":"17268dcd65664bf010f505e49763aa436ebaf7f59ed635e5e76a7ae0082b8379","source":{"kind":"arxiv","id":"1401.6571","version":1},"attestation_state":"computed","paper":{"title":"Keyword and Keyphrase Extraction Using Centrality Measures on Collocation Networks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Cornelia Caragea, Sagnik Ray Choudhury, Shibamouli Lahiri","submitted_at":"2014-01-25T19:05:45Z","abstract_excerpt":"Keyword and keyphrase extraction is an important problem in natural language processing, with applications ranging from summarization to semantic search to document clustering. Graph-based approaches to keyword and keyphrase extraction avoid the problem of acquiring a large in-domain training corpus by applying variants of PageRank algorithm on a network of words. Although graph-based approaches are knowledge-lean and easily adoptable in online systems, it remains largely open whether they can benefit from centrality measures other than PageRank. In this paper, we experiment with an array of c"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1401.6571","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-01-25T19:05:45Z","cross_cats_sorted":["cs.IR"],"title_canon_sha256":"e83d1bc21c1a24406d5dd68278fd6f5d424eb43af25d51ffd316990437582922","abstract_canon_sha256":"0d7dc7f6330fae92fe9e7667ed5c3b8fc59c2ee30d9dd283786f8accade81e6f"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T03:01:01.310822Z","signature_b64":"QckRuF9KGWFLsuIMVU2O/FO+2qFz+rgt3GQ+s3ZyZPCrOslMsLaTSl2itOkbwAnoBhmmy8tpjifZ/CmQaxB2Cg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"17268dcd65664bf010f505e49763aa436ebaf7f59ed635e5e76a7ae0082b8379","last_reissued_at":"2026-05-18T03:01:01.310287Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T03:01:01.310287Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Keyword and Keyphrase Extraction Using Centrality Measures on Collocation Networks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Cornelia Caragea, Sagnik Ray Choudhury, Shibamouli Lahiri","submitted_at":"2014-01-25T19:05:45Z","abstract_excerpt":"Keyword and keyphrase extraction is an important problem in natural language processing, with applications ranging from summarization to semantic search to document clustering. Graph-based approaches to keyword and keyphrase extraction avoid the problem of acquiring a large in-domain training corpus by applying variants of PageRank algorithm on a network of words. Although graph-based approaches are knowledge-lean and easily adoptable in online systems, it remains largely open whether they can benefit from centrality measures other than PageRank. In this paper, we experiment with an array of c"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1401.6571","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1401.6571","created_at":"2026-05-18T03:01:01.310376+00:00"},{"alias_kind":"arxiv_version","alias_value":"1401.6571v1","created_at":"2026-05-18T03:01:01.310376+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1401.6571","created_at":"2026-05-18T03:01:01.310376+00:00"},{"alias_kind":"pith_short_12","alias_value":"C4TI3TLFMZF7","created_at":"2026-05-18T12:28:22.404517+00:00"},{"alias_kind":"pith_short_16","alias_value":"C4TI3TLFMZF7AEHV","created_at":"2026-05-18T12:28:22.404517+00:00"},{"alias_kind":"pith_short_8","alias_value":"C4TI3TLF","created_at":"2026-05-18T12:28:22.404517+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN","json":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN.json","graph_json":"https://pith.science/api/pith-number/C4TI3TLFMZF7AEHVAXSJOY5KIN/graph.json","events_json":"https://pith.science/api/pith-number/C4TI3TLFMZF7AEHVAXSJOY5KIN/events.json","paper":"https://pith.science/paper/C4TI3TLF"},"agent_actions":{"view_html":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN","download_json":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN.json","view_paper":"https://pith.science/paper/C4TI3TLF","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1401.6571&json=true","fetch_graph":"https://pith.science/api/pith-number/C4TI3TLFMZF7AEHVAXSJOY5KIN/graph.json","fetch_events":"https://pith.science/api/pith-number/C4TI3TLFMZF7AEHVAXSJOY5KIN/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/action/timestamp_anchor","attest_storage":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/action/storage_attestation","attest_author":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/action/author_attestation","sign_citation":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/action/citation_signature","submit_replication":"https://pith.science/pith/C4TI3TLFMZF7AEHVAXSJOY5KIN/action/replication_record"}},"created_at":"2026-05-18T03:01:01.310376+00:00","updated_at":"2026-05-18T03:01:01.310376+00:00"}