{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:W4N3MTT7LCWSIG3SMTPXCRYVMS","short_pith_number":"pith:W4N3MTT7","canonical_record":{"source":{"id":"1511.08411","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-11-26T15:10:18Z","cross_cats_sorted":[],"title_canon_sha256":"21efe8f90b75b2b3b48006f8fcca2bfc79705acfadba3c64386315453b05c2d8","abstract_canon_sha256":"aab08eccd3e7bb716a04e12db40719c39b383a1a2e41d81607eb1f31efada710"},"schema_version":"1.0"},"canonical_sha256":"b71bb64e7f58ad241b7264df71471564bfec3cdd8b9ea1490cfb3eb42fc71095","source":{"kind":"arxiv","id":"1511.08411","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1511.08411","created_at":"2026-05-18T01:25:54Z"},{"alias_kind":"arxiv_version","alias_value":"1511.08411v1","created_at":"2026-05-18T01:25:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1511.08411","created_at":"2026-05-18T01:25:54Z"},{"alias_kind":"pith_short_12","alias_value":"W4N3MTT7LCWS","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_16","alias_value":"W4N3MTT7LCWSIG3S","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_8","alias_value":"W4N3MTT7","created_at":"2026-05-18T12:29:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:W4N3MTT7LCWSIG3SMTPXCRYVMS","target":"record","payload":{"canonical_record":{"source":{"id":"1511.08411","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-11-26T15:10:18Z","cross_cats_sorted":[],"title_canon_sha256":"21efe8f90b75b2b3b48006f8fcca2bfc79705acfadba3c64386315453b05c2d8","abstract_canon_sha256":"aab08eccd3e7bb716a04e12db40719c39b383a1a2e41d81607eb1f31efada710"},"schema_version":"1.0"},"canonical_sha256":"b71bb64e7f58ad241b7264df71471564bfec3cdd8b9ea1490cfb3eb42fc71095","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:25:54.139499Z","signature_b64":"hyPs2ozuuBMgCwUnlGyJ0mfg2Lr2llZxiDaqS68Usg4FO7s9vMG1g2DYTK/nS2yT2Wst+C5uFDpP9O3sAKPoAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b71bb64e7f58ad241b7264df71471564bfec3cdd8b9ea1490cfb3eb42fc71095","last_reissued_at":"2026-05-18T01:25:54.138577Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:25:54.138577Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1511.08411","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:25:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"XLDukERXNrSBF4gvuSWfe3SY4hwlM1JmXjBxEJAIQVsekpSss0E6cWQf50mxOUmtcV98clLKC4nAL0V/lJX0AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T14:45:56.372890Z"},"content_sha256":"f0814374113f993e658fa183ba9faeabcb5b9b897a993afadc28d6a95d63e3ba","schema_version":"1.0","event_id":"sha256:f0814374113f993e658fa183ba9faeabcb5b9b897a993afadc28d6a95d63e3ba"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:W4N3MTT7LCWSIG3SMTPXCRYVMS","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"OntoSeg: a Novel Approach to Text Segmentation using Ontological Similarity","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Killian Levacher, Mostafa Bayomi, M. Rami Ghorab, S\\'eamus Lawless","submitted_at":"2015-11-26T15:10:18Z","abstract_excerpt":"Text segmentation (TS) aims at dividing long text into coherent segments which reflect the subtopic structure of the text. It is beneficial to many natural language processing tasks, such as Information Retrieval (IR) and document summarisation. Current approaches to text segmentation are similar in that they all use word-frequency metrics to measure the similarity between two regions of text, so that a document is segmented based on the lexical cohesion between its words. Various NLP tasks are now moving towards the semantic web and ontologies, such as ontology-based IR systems, to capture th"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1511.08411","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:25:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CWRPglZsAKekxhR1NHXgSLHPmJG7GjqloHSPh4+Aj7jM9XlFbKbinkwYzfQ5Z/8pzc9hHEDthp7GmAr3RFFaCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T14:45:56.373242Z"},"content_sha256":"c37f763e6ff71a9ec4841b987d0dc6960331487c2d82372bf65976d7d58a748f","schema_version":"1.0","event_id":"sha256:c37f763e6ff71a9ec4841b987d0dc6960331487c2d82372bf65976d7d58a748f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/W4N3MTT7LCWSIG3SMTPXCRYVMS/bundle.json","state_url":"https://pith.science/pith/W4N3MTT7LCWSIG3SMTPXCRYVMS/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/W4N3MTT7LCWSIG3SMTPXCRYVMS/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T14:45:56Z","links":{"resolver":"https://pith.science/pith/W4N3MTT7LCWSIG3SMTPXCRYVMS","bundle":"https://pith.science/pith/W4N3MTT7LCWSIG3SMTPXCRYVMS/bundle.json","state":"https://pith.science/pith/W4N3MTT7LCWSIG3SMTPXCRYVMS/state.json","well_known_bundle":"https://pith.science/.well-known/pith/W4N3MTT7LCWSIG3SMTPXCRYVMS/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:W4N3MTT7LCWSIG3SMTPXCRYVMS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"aab08eccd3e7bb716a04e12db40719c39b383a1a2e41d81607eb1f31efada710","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-11-26T15:10:18Z","title_canon_sha256":"21efe8f90b75b2b3b48006f8fcca2bfc79705acfadba3c64386315453b05c2d8"},"schema_version":"1.0","source":{"id":"1511.08411","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1511.08411","created_at":"2026-05-18T01:25:54Z"},{"alias_kind":"arxiv_version","alias_value":"1511.08411v1","created_at":"2026-05-18T01:25:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1511.08411","created_at":"2026-05-18T01:25:54Z"},{"alias_kind":"pith_short_12","alias_value":"W4N3MTT7LCWS","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_16","alias_value":"W4N3MTT7LCWSIG3S","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_8","alias_value":"W4N3MTT7","created_at":"2026-05-18T12:29:47Z"}],"graph_snapshots":[{"event_id":"sha256:c37f763e6ff71a9ec4841b987d0dc6960331487c2d82372bf65976d7d58a748f","target":"graph","created_at":"2026-05-18T01:25:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Text segmentation (TS) aims at dividing long text into coherent segments which reflect the subtopic structure of the text. It is beneficial to many natural language processing tasks, such as Information Retrieval (IR) and document summarisation. Current approaches to text segmentation are similar in that they all use word-frequency metrics to measure the similarity between two regions of text, so that a document is segmented based on the lexical cohesion between its words. Various NLP tasks are now moving towards the semantic web and ontologies, such as ontology-based IR systems, to capture th","authors_text":"Killian Levacher, Mostafa Bayomi, M. Rami Ghorab, S\\'eamus Lawless","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-11-26T15:10:18Z","title":"OntoSeg: a Novel Approach to Text Segmentation using Ontological Similarity"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1511.08411","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f0814374113f993e658fa183ba9faeabcb5b9b897a993afadc28d6a95d63e3ba","target":"record","created_at":"2026-05-18T01:25:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"aab08eccd3e7bb716a04e12db40719c39b383a1a2e41d81607eb1f31efada710","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-11-26T15:10:18Z","title_canon_sha256":"21efe8f90b75b2b3b48006f8fcca2bfc79705acfadba3c64386315453b05c2d8"},"schema_version":"1.0","source":{"id":"1511.08411","kind":"arxiv","version":1}},"canonical_sha256":"b71bb64e7f58ad241b7264df71471564bfec3cdd8b9ea1490cfb3eb42fc71095","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b71bb64e7f58ad241b7264df71471564bfec3cdd8b9ea1490cfb3eb42fc71095","first_computed_at":"2026-05-18T01:25:54.138577Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:25:54.138577Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"hyPs2ozuuBMgCwUnlGyJ0mfg2Lr2llZxiDaqS68Usg4FO7s9vMG1g2DYTK/nS2yT2Wst+C5uFDpP9O3sAKPoAg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:25:54.139499Z","signed_message":"canonical_sha256_bytes"},"source_id":"1511.08411","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f0814374113f993e658fa183ba9faeabcb5b9b897a993afadc28d6a95d63e3ba","sha256:c37f763e6ff71a9ec4841b987d0dc6960331487c2d82372bf65976d7d58a748f"],"state_sha256":"d3af06ce802ba0d1f3df0479874dd449c57faf57e87287f45ce6a461b08cbea6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cKKd4ELXfysq0AbcHE0a3Pczk4RRoAL9+jEfhDq74vVLrL71JAZWZNc0C05rVe9MgtpTERSeMo5IZGwh/v8RCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T14:45:56.375263Z","bundle_sha256":"736200d55b6ede177c8a6748318fbfcb922887e6dc08dbe9cd4d085cdde2afbc"}}