{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2014:BFTYCJSUTRGX3SIXNVPLWLQ3VJ","short_pith_number":"pith:BFTYCJSU","canonical_record":{"source":{"id":"1406.5616","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2014-06-21T14:33:09Z","cross_cats_sorted":[],"title_canon_sha256":"0971f251522ab4c435bc34d78781ef7c914c8be363cadddbaf68d7f31c8d0b92","abstract_canon_sha256":"eab42655b721a2a450f57bc7ae746b8c965e3d19ebbdf2ffe8f85781cd60a3c8"},"schema_version":"1.0"},"canonical_sha256":"09678126549c4d7dc9176d5ebb2e1baa67ca8eaecc15f04a49ac8f886738ca91","source":{"kind":"arxiv","id":"1406.5616","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1406.5616","created_at":"2026-05-18T02:49:11Z"},{"alias_kind":"arxiv_version","alias_value":"1406.5616v1","created_at":"2026-05-18T02:49:11Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1406.5616","created_at":"2026-05-18T02:49:11Z"},{"alias_kind":"pith_short_12","alias_value":"BFTYCJSUTRGX","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_16","alias_value":"BFTYCJSUTRGX3SIX","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_8","alias_value":"BFTYCJSU","created_at":"2026-05-18T12:28:22Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2014:BFTYCJSUTRGX3SIXNVPLWLQ3VJ","target":"record","payload":{"canonical_record":{"source":{"id":"1406.5616","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2014-06-21T14:33:09Z","cross_cats_sorted":[],"title_canon_sha256":"0971f251522ab4c435bc34d78781ef7c914c8be363cadddbaf68d7f31c8d0b92","abstract_canon_sha256":"eab42655b721a2a450f57bc7ae746b8c965e3d19ebbdf2ffe8f85781cd60a3c8"},"schema_version":"1.0"},"canonical_sha256":"09678126549c4d7dc9176d5ebb2e1baa67ca8eaecc15f04a49ac8f886738ca91","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:49:11.137785Z","signature_b64":"xuDeb8fm1PLt+/sbFkC5b5xGf3ppPCUPs5mIeKnci3uqM4jGIOU/JiaX9MANaj28QLnjhDHnFtzUsGWOG8uTBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"09678126549c4d7dc9176d5ebb2e1baa67ca8eaecc15f04a49ac8f886738ca91","last_reissued_at":"2026-05-18T02:49:11.137343Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:49:11.137343Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1406.5616","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:49:11Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"phoGWB1ecWMyf6BXRNjueLi23TIQgSCJo7kSCn7zNAJT5344jXQrpoQAhy5USoJ1oif797Egyt6j2uqVg/7OAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T20:20:24.150916Z"},"content_sha256":"2bfcda3a7095b78e1f2876561e3e6b4d2c050aa3cfe5b25d2a56f85015a11279","schema_version":"1.0","event_id":"sha256:2bfcda3a7095b78e1f2876561e3e6b4d2c050aa3cfe5b25d2a56f85015a11279"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2014:BFTYCJSUTRGX3SIXNVPLWLQ3VJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"An Effective Approach for Web Document Classification using the Concept of Association Analysis of Data Mining","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"R.K. Roul, S.K. Sahay","submitted_at":"2014-06-21T14:33:09Z","abstract_excerpt":"Exponential growth of the web increased the importance of web document classification and data mining. To get the exact information, in the form of knowing what classes a web document belongs to, is expensive. Automatic classification of web document is of great use to search engines which provides this information at a low cost. In this paper, we propose an approach for classifying the web document using the frequent item word sets generated by the Frequent Pattern (FP) Growth which is an association analysis technique of data mining. These set of associated words act as feature set. The fina"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1406.5616","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:49:11Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VK4bogicv3+TOmrSWrES+1gu04b8aSAnIvUleFL5sZdmiVP3YQyNmvwAvpLxTluQpaxFDF/zcbQGOu9HiSkYBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T20:20:24.151255Z"},"content_sha256":"d8c31b57aaaf86caf5a6c221b34e32a86db94d3a146623ac96abad894b1aeef1","schema_version":"1.0","event_id":"sha256:d8c31b57aaaf86caf5a6c221b34e32a86db94d3a146623ac96abad894b1aeef1"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/BFTYCJSUTRGX3SIXNVPLWLQ3VJ/bundle.json","state_url":"https://pith.science/pith/BFTYCJSUTRGX3SIXNVPLWLQ3VJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/BFTYCJSUTRGX3SIXNVPLWLQ3VJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T20:20:24Z","links":{"resolver":"https://pith.science/pith/BFTYCJSUTRGX3SIXNVPLWLQ3VJ","bundle":"https://pith.science/pith/BFTYCJSUTRGX3SIXNVPLWLQ3VJ/bundle.json","state":"https://pith.science/pith/BFTYCJSUTRGX3SIXNVPLWLQ3VJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/BFTYCJSUTRGX3SIXNVPLWLQ3VJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:BFTYCJSUTRGX3SIXNVPLWLQ3VJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"eab42655b721a2a450f57bc7ae746b8c965e3d19ebbdf2ffe8f85781cd60a3c8","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2014-06-21T14:33:09Z","title_canon_sha256":"0971f251522ab4c435bc34d78781ef7c914c8be363cadddbaf68d7f31c8d0b92"},"schema_version":"1.0","source":{"id":"1406.5616","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1406.5616","created_at":"2026-05-18T02:49:11Z"},{"alias_kind":"arxiv_version","alias_value":"1406.5616v1","created_at":"2026-05-18T02:49:11Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1406.5616","created_at":"2026-05-18T02:49:11Z"},{"alias_kind":"pith_short_12","alias_value":"BFTYCJSUTRGX","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_16","alias_value":"BFTYCJSUTRGX3SIX","created_at":"2026-05-18T12:28:22Z"},{"alias_kind":"pith_short_8","alias_value":"BFTYCJSU","created_at":"2026-05-18T12:28:22Z"}],"graph_snapshots":[{"event_id":"sha256:d8c31b57aaaf86caf5a6c221b34e32a86db94d3a146623ac96abad894b1aeef1","target":"graph","created_at":"2026-05-18T02:49:11Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Exponential growth of the web increased the importance of web document classification and data mining. To get the exact information, in the form of knowing what classes a web document belongs to, is expensive. Automatic classification of web document is of great use to search engines which provides this information at a low cost. In this paper, we propose an approach for classifying the web document using the frequent item word sets generated by the Frequent Pattern (FP) Growth which is an association analysis technique of data mining. These set of associated words act as feature set. The fina","authors_text":"R.K. Roul, S.K. Sahay","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2014-06-21T14:33:09Z","title":"An Effective Approach for Web Document Classification using the Concept of Association Analysis of Data Mining"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1406.5616","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2bfcda3a7095b78e1f2876561e3e6b4d2c050aa3cfe5b25d2a56f85015a11279","target":"record","created_at":"2026-05-18T02:49:11Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"eab42655b721a2a450f57bc7ae746b8c965e3d19ebbdf2ffe8f85781cd60a3c8","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2014-06-21T14:33:09Z","title_canon_sha256":"0971f251522ab4c435bc34d78781ef7c914c8be363cadddbaf68d7f31c8d0b92"},"schema_version":"1.0","source":{"id":"1406.5616","kind":"arxiv","version":1}},"canonical_sha256":"09678126549c4d7dc9176d5ebb2e1baa67ca8eaecc15f04a49ac8f886738ca91","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"09678126549c4d7dc9176d5ebb2e1baa67ca8eaecc15f04a49ac8f886738ca91","first_computed_at":"2026-05-18T02:49:11.137343Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:49:11.137343Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"xuDeb8fm1PLt+/sbFkC5b5xGf3ppPCUPs5mIeKnci3uqM4jGIOU/JiaX9MANaj28QLnjhDHnFtzUsGWOG8uTBw==","signature_status":"signed_v1","signed_at":"2026-05-18T02:49:11.137785Z","signed_message":"canonical_sha256_bytes"},"source_id":"1406.5616","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2bfcda3a7095b78e1f2876561e3e6b4d2c050aa3cfe5b25d2a56f85015a11279","sha256:d8c31b57aaaf86caf5a6c221b34e32a86db94d3a146623ac96abad894b1aeef1"],"state_sha256":"442a4b4f864d65ce6ec7fb3b78f09323ef1e435f153bfc12e6330208b045f6e6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DEqUGE1uPOGLNZUl8qMDPtaKYso29QZQvRixPTTGlxGEzGntugjdx1fVXuxrVjKX+MWcYkLinKZCrn4n60i/CA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T20:20:24.153125Z","bundle_sha256":"d23f69f212726b8252dc21db3529ed99be1bd387ab5804f2504dbb444941b215"}}