{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2014:JCBMZF5IKV5ZQ7N7LFKG2O6246","short_pith_number":"pith:JCBMZF5I","canonical_record":{"source":{"id":"1411.5796","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-11-21T08:50:30Z","cross_cats_sorted":[],"title_canon_sha256":"62d68c45e9e855f995e3211c48b708817af7ce994cc88745f5018a4aac4550ef","abstract_canon_sha256":"d8dacfac12e055aabaa7607a21bb9cfea8bc7a9538f74efc931d50c78ae2ff59"},"schema_version":"1.0"},"canonical_sha256":"4882cc97a8557b987dbf59546d3bdae79b9032720a40761e04aeeb6ac6c61be5","source":{"kind":"arxiv","id":"1411.5796","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1411.5796","created_at":"2026-05-18T02:33:07Z"},{"alias_kind":"arxiv_version","alias_value":"1411.5796v1","created_at":"2026-05-18T02:33:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1411.5796","created_at":"2026-05-18T02:33:07Z"},{"alias_kind":"pith_short_12","alias_value":"JCBMZF5IKV5Z","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_16","alias_value":"JCBMZF5IKV5ZQ7N7","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_8","alias_value":"JCBMZF5I","created_at":"2026-05-18T12:28:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2014:JCBMZF5IKV5ZQ7N7LFKG2O6246","target":"record","payload":{"canonical_record":{"source":{"id":"1411.5796","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-11-21T08:50:30Z","cross_cats_sorted":[],"title_canon_sha256":"62d68c45e9e855f995e3211c48b708817af7ce994cc88745f5018a4aac4550ef","abstract_canon_sha256":"d8dacfac12e055aabaa7607a21bb9cfea8bc7a9538f74efc931d50c78ae2ff59"},"schema_version":"1.0"},"canonical_sha256":"4882cc97a8557b987dbf59546d3bdae79b9032720a40761e04aeeb6ac6c61be5","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:33:07.076803Z","signature_b64":"uYj8j5u59MKnk7+CzoZi9cesOqBBZkmdVvStumCt0uo+QjLGL8d2P22WK8uHXudNYmOqTA0XUQFeh+0zOo/uDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4882cc97a8557b987dbf59546d3bdae79b9032720a40761e04aeeb6ac6c61be5","last_reissued_at":"2026-05-18T02:33:07.076391Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:33:07.076391Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1411.5796","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:33:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G3wtndnCdzM2fR0mMnJLvl9Hl8AlHLrrEmLSTeYMaRaml13FMBtKrUjeYzb3HdHGFDlxL7ZpXsalR5ZUZlvVBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T06:03:50.182121Z"},"content_sha256":"39eaac8e99581346e1305282e213ed2d83fae0ca89ef3a69c6bd83b98fedb256","schema_version":"1.0","event_id":"sha256:39eaac8e99581346e1305282e213ed2d83fae0ca89ef3a69c6bd83b98fedb256"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2014:JCBMZF5IKV5ZQ7N7LFKG2O6246","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Pre-processing of Domain Ontology Graph Generation System in Punjabi","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Rajveer Kaur, Saurabh Sharma","submitted_at":"2014-11-21T08:50:30Z","abstract_excerpt":"This paper describes pre-processing phase of ontology graph generation system from Punjabi text documents of different domains. This research paper focuses on pre-processing of Punjabi text documents. Pre-processing is structured representation of the input text. Pre-processing of ontology graph generation includes allowing input restrictions to the text, removal of special symbols and punctuation marks, removal of duplicate terms, removal of stop words, extract terms by matching input terms with dictionary and gazetteer lists terms."},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1411.5796","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:33:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qqGAW6ODqmuj+HGxnH2PUuhuhObMiZ2rgtT9JBSn1a5QkAUZIPMfhHxrpAcKALoVEzhEKTMphvCNCVECLQMRAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T06:03:50.182482Z"},"content_sha256":"0d60ce5e55371529fd298ccb8faf4b4eba4af5a90c78c677456446f07077bebe","schema_version":"1.0","event_id":"sha256:0d60ce5e55371529fd298ccb8faf4b4eba4af5a90c78c677456446f07077bebe"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JCBMZF5IKV5ZQ7N7LFKG2O6246/bundle.json","state_url":"https://pith.science/pith/JCBMZF5IKV5ZQ7N7LFKG2O6246/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JCBMZF5IKV5ZQ7N7LFKG2O6246/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T06:03:50Z","links":{"resolver":"https://pith.science/pith/JCBMZF5IKV5ZQ7N7LFKG2O6246","bundle":"https://pith.science/pith/JCBMZF5IKV5ZQ7N7LFKG2O6246/bundle.json","state":"https://pith.science/pith/JCBMZF5IKV5ZQ7N7LFKG2O6246/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JCBMZF5IKV5ZQ7N7LFKG2O6246/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:JCBMZF5IKV5ZQ7N7LFKG2O6246","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d8dacfac12e055aabaa7607a21bb9cfea8bc7a9538f74efc931d50c78ae2ff59","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-11-21T08:50:30Z","title_canon_sha256":"62d68c45e9e855f995e3211c48b708817af7ce994cc88745f5018a4aac4550ef"},"schema_version":"1.0","source":{"id":"1411.5796","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1411.5796","created_at":"2026-05-18T02:33:07Z"},{"alias_kind":"arxiv_version","alias_value":"1411.5796v1","created_at":"2026-05-18T02:33:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1411.5796","created_at":"2026-05-18T02:33:07Z"},{"alias_kind":"pith_short_12","alias_value":"JCBMZF5IKV5Z","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_16","alias_value":"JCBMZF5IKV5ZQ7N7","created_at":"2026-05-18T12:28:33Z"},{"alias_kind":"pith_short_8","alias_value":"JCBMZF5I","created_at":"2026-05-18T12:28:33Z"}],"graph_snapshots":[{"event_id":"sha256:0d60ce5e55371529fd298ccb8faf4b4eba4af5a90c78c677456446f07077bebe","target":"graph","created_at":"2026-05-18T02:33:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"This paper describes pre-processing phase of ontology graph generation system from Punjabi text documents of different domains. This research paper focuses on pre-processing of Punjabi text documents. Pre-processing is structured representation of the input text. Pre-processing of ontology graph generation includes allowing input restrictions to the text, removal of special symbols and punctuation marks, removal of duplicate terms, removal of stop words, extract terms by matching input terms with dictionary and gazetteer lists terms.","authors_text":"Rajveer Kaur, Saurabh Sharma","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-11-21T08:50:30Z","title":"Pre-processing of Domain Ontology Graph Generation System in Punjabi"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1411.5796","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:39eaac8e99581346e1305282e213ed2d83fae0ca89ef3a69c6bd83b98fedb256","target":"record","created_at":"2026-05-18T02:33:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d8dacfac12e055aabaa7607a21bb9cfea8bc7a9538f74efc931d50c78ae2ff59","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2014-11-21T08:50:30Z","title_canon_sha256":"62d68c45e9e855f995e3211c48b708817af7ce994cc88745f5018a4aac4550ef"},"schema_version":"1.0","source":{"id":"1411.5796","kind":"arxiv","version":1}},"canonical_sha256":"4882cc97a8557b987dbf59546d3bdae79b9032720a40761e04aeeb6ac6c61be5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4882cc97a8557b987dbf59546d3bdae79b9032720a40761e04aeeb6ac6c61be5","first_computed_at":"2026-05-18T02:33:07.076391Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:33:07.076391Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"uYj8j5u59MKnk7+CzoZi9cesOqBBZkmdVvStumCt0uo+QjLGL8d2P22WK8uHXudNYmOqTA0XUQFeh+0zOo/uDg==","signature_status":"signed_v1","signed_at":"2026-05-18T02:33:07.076803Z","signed_message":"canonical_sha256_bytes"},"source_id":"1411.5796","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:39eaac8e99581346e1305282e213ed2d83fae0ca89ef3a69c6bd83b98fedb256","sha256:0d60ce5e55371529fd298ccb8faf4b4eba4af5a90c78c677456446f07077bebe"],"state_sha256":"9efa81249b614e834633a7d6e6928884eeff337e6dbfde5f9c6942b1a7f8aca3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5TLXPzZ9EhdGecpkTP76Yr7tC1FVECX+E8geogu3qhxe7UUq2stBrhC3n84mdAR4hAsQ9CiAh91UyMO1rwT9CQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T06:03:50.184620Z","bundle_sha256":"4f786ae7ddd162db2cca6199cb9a9cdcfd0c0e18bfd479d12a3ff2a806ad46e0"}}