{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2012:XGZ66BDBKU7R2WBZGM3QTU74SP","short_pith_number":"pith:XGZ66BDB","canonical_record":{"source":{"id":"1212.5423","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-12-21T13:25:00Z","cross_cats_sorted":["cs.DL","stat.ML"],"title_canon_sha256":"f9913bbce01fc4003c533bb1cac09093468a790be9e214e6b33009e6e0ebb3ed","abstract_canon_sha256":"e2b73f4b965b7fc612308142afcbbe9f4f76a7dc58cd26ddf800b5b6233e8600"},"schema_version":"1.0"},"canonical_sha256":"b9b3ef0461553f1d5839333709d3fc93cf9d628381b1c34cde7c93b4c565f5e3","source":{"kind":"arxiv","id":"1212.5423","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1212.5423","created_at":"2026-05-18T02:17:22Z"},{"alias_kind":"arxiv_version","alias_value":"1212.5423v2","created_at":"2026-05-18T02:17:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1212.5423","created_at":"2026-05-18T02:17:22Z"},{"alias_kind":"pith_short_12","alias_value":"XGZ66BDBKU7R","created_at":"2026-05-18T12:27:27Z"},{"alias_kind":"pith_short_16","alias_value":"XGZ66BDBKU7R2WBZ","created_at":"2026-05-18T12:27:27Z"},{"alias_kind":"pith_short_8","alias_value":"XGZ66BDB","created_at":"2026-05-18T12:27:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2012:XGZ66BDBKU7R2WBZGM3QTU74SP","target":"record","payload":{"canonical_record":{"source":{"id":"1212.5423","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-12-21T13:25:00Z","cross_cats_sorted":["cs.DL","stat.ML"],"title_canon_sha256":"f9913bbce01fc4003c533bb1cac09093468a790be9e214e6b33009e6e0ebb3ed","abstract_canon_sha256":"e2b73f4b965b7fc612308142afcbbe9f4f76a7dc58cd26ddf800b5b6233e8600"},"schema_version":"1.0"},"canonical_sha256":"b9b3ef0461553f1d5839333709d3fc93cf9d628381b1c34cde7c93b4c565f5e3","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:17:22.126937Z","signature_b64":"YfX+ebMMJmajoi5Le3881YBAe5Up5+NwctW5XjIe0tXy6FyOTgtaTmwl2F/J+7UnWNt6ZJuACXoiDhgSQkmrDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b9b3ef0461553f1d5839333709d3fc93cf9d628381b1c34cde7c93b4c565f5e3","last_reissued_at":"2026-05-18T02:17:22.126220Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:17:22.126220Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1212.5423","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:17:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IOF4mslFAEjH4DUMZYAlx1RAdcbhpKeu+JHl/bTpdtANeVc1CG12VWhrKhWJnBSrTxDDW5dY3CYxZuE5xnc5Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T01:14:55.070767Z"},"content_sha256":"6ed88fdd7512accdafe42380c0e773f8f9da8a705d73e7aa0ae33a7536b95b67","schema_version":"1.0","event_id":"sha256:6ed88fdd7512accdafe42380c0e773f8f9da8a705d73e7aa0ae33a7536b95b67"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2012:XGZ66BDBKU7R2WBZGM3QTU74SP","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Topic Extraction and Bundling of Related Scientific Articles","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DL","stat.ML"],"primary_cat":"cs.IR","authors_text":"Shameem A Puthiya Parambath","submitted_at":"2012-12-21T13:25:00Z","abstract_excerpt":"Automatic classification of scientific articles based on common characteristics is an interesting problem with many applications in digital library and information retrieval systems. Properly organized articles can be useful for automatic generation of taxonomies in scientific writings, textual summarization, efficient information retrieval etc. Generating article bundles from a large number of input articles, based on the associated features of the articles is tedious and computationally expensive task. In this report we propose an automatic two-step approach for topic extraction and bundling"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1212.5423","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:17:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pg8Y2VvjU2m5OVZ10MW39/vA2fwHds6WYYKEuQmYCKzRC/o8ERm6ED8A1mJ1J18HxbcQ+ZPjWHUVEObSRL7+AA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T01:14:55.071122Z"},"content_sha256":"1b571717e454e5b18b5e74e2deb7800f4c75881ae00a11ec441f100916018b7f","schema_version":"1.0","event_id":"sha256:1b571717e454e5b18b5e74e2deb7800f4c75881ae00a11ec441f100916018b7f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XGZ66BDBKU7R2WBZGM3QTU74SP/bundle.json","state_url":"https://pith.science/pith/XGZ66BDBKU7R2WBZGM3QTU74SP/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XGZ66BDBKU7R2WBZGM3QTU74SP/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T01:14:55Z","links":{"resolver":"https://pith.science/pith/XGZ66BDBKU7R2WBZGM3QTU74SP","bundle":"https://pith.science/pith/XGZ66BDBKU7R2WBZGM3QTU74SP/bundle.json","state":"https://pith.science/pith/XGZ66BDBKU7R2WBZGM3QTU74SP/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XGZ66BDBKU7R2WBZGM3QTU74SP/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2012:XGZ66BDBKU7R2WBZGM3QTU74SP","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e2b73f4b965b7fc612308142afcbbe9f4f76a7dc58cd26ddf800b5b6233e8600","cross_cats_sorted":["cs.DL","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-12-21T13:25:00Z","title_canon_sha256":"f9913bbce01fc4003c533bb1cac09093468a790be9e214e6b33009e6e0ebb3ed"},"schema_version":"1.0","source":{"id":"1212.5423","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1212.5423","created_at":"2026-05-18T02:17:22Z"},{"alias_kind":"arxiv_version","alias_value":"1212.5423v2","created_at":"2026-05-18T02:17:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1212.5423","created_at":"2026-05-18T02:17:22Z"},{"alias_kind":"pith_short_12","alias_value":"XGZ66BDBKU7R","created_at":"2026-05-18T12:27:27Z"},{"alias_kind":"pith_short_16","alias_value":"XGZ66BDBKU7R2WBZ","created_at":"2026-05-18T12:27:27Z"},{"alias_kind":"pith_short_8","alias_value":"XGZ66BDB","created_at":"2026-05-18T12:27:27Z"}],"graph_snapshots":[{"event_id":"sha256:1b571717e454e5b18b5e74e2deb7800f4c75881ae00a11ec441f100916018b7f","target":"graph","created_at":"2026-05-18T02:17:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Automatic classification of scientific articles based on common characteristics is an interesting problem with many applications in digital library and information retrieval systems. Properly organized articles can be useful for automatic generation of taxonomies in scientific writings, textual summarization, efficient information retrieval etc. Generating article bundles from a large number of input articles, based on the associated features of the articles is tedious and computationally expensive task. In this report we propose an automatic two-step approach for topic extraction and bundling","authors_text":"Shameem A Puthiya Parambath","cross_cats":["cs.DL","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-12-21T13:25:00Z","title":"Topic Extraction and Bundling of Related Scientific Articles"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1212.5423","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6ed88fdd7512accdafe42380c0e773f8f9da8a705d73e7aa0ae33a7536b95b67","target":"record","created_at":"2026-05-18T02:17:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e2b73f4b965b7fc612308142afcbbe9f4f76a7dc58cd26ddf800b5b6233e8600","cross_cats_sorted":["cs.DL","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2012-12-21T13:25:00Z","title_canon_sha256":"f9913bbce01fc4003c533bb1cac09093468a790be9e214e6b33009e6e0ebb3ed"},"schema_version":"1.0","source":{"id":"1212.5423","kind":"arxiv","version":2}},"canonical_sha256":"b9b3ef0461553f1d5839333709d3fc93cf9d628381b1c34cde7c93b4c565f5e3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b9b3ef0461553f1d5839333709d3fc93cf9d628381b1c34cde7c93b4c565f5e3","first_computed_at":"2026-05-18T02:17:22.126220Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:17:22.126220Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"YfX+ebMMJmajoi5Le3881YBAe5Up5+NwctW5XjIe0tXy6FyOTgtaTmwl2F/J+7UnWNt6ZJuACXoiDhgSQkmrDw==","signature_status":"signed_v1","signed_at":"2026-05-18T02:17:22.126937Z","signed_message":"canonical_sha256_bytes"},"source_id":"1212.5423","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6ed88fdd7512accdafe42380c0e773f8f9da8a705d73e7aa0ae33a7536b95b67","sha256:1b571717e454e5b18b5e74e2deb7800f4c75881ae00a11ec441f100916018b7f"],"state_sha256":"a1fe24e86045a208a69ffca62b49e789da5e890d8f88c1680826351fce04e09f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"XEs8oTN0XsH6Yh3zUL/nrecKbi4QMTma4/Xgm9z66CVDzvDtP1AOZB9Z6q3vLydZMrSFVjxt3mvJrDK8VF2VDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T01:14:55.073206Z","bundle_sha256":"cf1cc2a83389d822cc2d632d2a862eeef05f2fb3865791b1df971878f46c6300"}}