{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:4KSVXGVTXLLJRUOVZ7ASNZTJQX","short_pith_number":"pith:4KSVXGVT","canonical_record":{"source":{"id":"1808.08850","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-27T14:02:58Z","cross_cats_sorted":[],"title_canon_sha256":"95709a21b27edecab4b327e6d884b4439a0dc34e545ca60b14052b171b360081","abstract_canon_sha256":"5271759ead9ff167e6bcfa11f1aa89a180e61e37ee4c5392c70345e8d026187c"},"schema_version":"1.0"},"canonical_sha256":"e2a55b9ab3bad698d1d5cfc126e66985c794a8f4a2690283ecc1ff29d36c4b92","source":{"kind":"arxiv","id":"1808.08850","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.08850","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"arxiv_version","alias_value":"1808.08850v1","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.08850","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"pith_short_12","alias_value":"4KSVXGVTXLLJ","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"4KSVXGVTXLLJRUOV","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"4KSVXGVT","created_at":"2026-05-18T12:32:05Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:4KSVXGVTXLLJRUOVZ7ASNZTJQX","target":"record","payload":{"canonical_record":{"source":{"id":"1808.08850","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-27T14:02:58Z","cross_cats_sorted":[],"title_canon_sha256":"95709a21b27edecab4b327e6d884b4439a0dc34e545ca60b14052b171b360081","abstract_canon_sha256":"5271759ead9ff167e6bcfa11f1aa89a180e61e37ee4c5392c70345e8d026187c"},"schema_version":"1.0"},"canonical_sha256":"e2a55b9ab3bad698d1d5cfc126e66985c794a8f4a2690283ecc1ff29d36c4b92","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:07:13.048384Z","signature_b64":"jS92p0mRPJiIswqXgB6KZDvjOKJ5I26ls1ro94P7zSgXwhenVuAz8Ti4jpzk92qH5Z34fwMBTask5mYI6UWSBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e2a55b9ab3bad698d1d5cfc126e66985c794a8f4a2690283ecc1ff29d36c4b92","last_reissued_at":"2026-05-18T00:07:13.047864Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:07:13.047864Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1808.08850","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"GKJIWh1IXfd/7V8qgleop9McIQtpCeOYZ1E1tlmPKoRifZbsoz5RcbMkx2DcW4fBoyqPmeGY08GqGGXSKzDLBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T06:34:46.465974Z"},"content_sha256":"5b6bfaff9675bd4eed8c5b2cf6c5b7948a0dfcde1330adf1901d11523207a32d","schema_version":"1.0","event_id":"sha256:5b6bfaff9675bd4eed8c5b2cf6c5b7948a0dfcde1330adf1901d11523207a32d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:4KSVXGVTXLLJRUOVZ7ASNZTJQX","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"WiSeBE: Window-based Sentence Boundary Evaluation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Carlos-Emiliano Gonz\\'alez-Gallardo, Juan-Manuel Torres-Moreno","submitted_at":"2018-08-27T14:02:58Z","abstract_excerpt":"Sentence Boundary Detection (SBD) has been a major research topic since Automatic Speech Recognition transcripts have been used for further Natural Language Processing tasks like Part of Speech Tagging, Question Answering or Automatic Summarization. But what about evaluation? Do standard evaluation metrics like precision, recall, F-score or classification error; and more important, evaluating an automatic system against a unique reference is enough to conclude how well a SBD system is performing given the final application of the transcript? In this paper we propose Window-based Sentence Bound"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.08850","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cstHTgpuLUUUgRdSVe4t7gmL+Jfk3WY0VaH0t0XryGlVfASUBgBelXBgFh6yQdOL3z/+xoWxIUVyQrl7nXoOCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T06:34:46.466615Z"},"content_sha256":"6bef4968991f7f4ff692b513124e231f740bece750c1d69e2d40c62f85481077","schema_version":"1.0","event_id":"sha256:6bef4968991f7f4ff692b513124e231f740bece750c1d69e2d40c62f85481077"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/4KSVXGVTXLLJRUOVZ7ASNZTJQX/bundle.json","state_url":"https://pith.science/pith/4KSVXGVTXLLJRUOVZ7ASNZTJQX/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/4KSVXGVTXLLJRUOVZ7ASNZTJQX/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T06:34:46Z","links":{"resolver":"https://pith.science/pith/4KSVXGVTXLLJRUOVZ7ASNZTJQX","bundle":"https://pith.science/pith/4KSVXGVTXLLJRUOVZ7ASNZTJQX/bundle.json","state":"https://pith.science/pith/4KSVXGVTXLLJRUOVZ7ASNZTJQX/state.json","well_known_bundle":"https://pith.science/.well-known/pith/4KSVXGVTXLLJRUOVZ7ASNZTJQX/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:4KSVXGVTXLLJRUOVZ7ASNZTJQX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5271759ead9ff167e6bcfa11f1aa89a180e61e37ee4c5392c70345e8d026187c","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-27T14:02:58Z","title_canon_sha256":"95709a21b27edecab4b327e6d884b4439a0dc34e545ca60b14052b171b360081"},"schema_version":"1.0","source":{"id":"1808.08850","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.08850","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"arxiv_version","alias_value":"1808.08850v1","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.08850","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"pith_short_12","alias_value":"4KSVXGVTXLLJ","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"4KSVXGVTXLLJRUOV","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"4KSVXGVT","created_at":"2026-05-18T12:32:05Z"}],"graph_snapshots":[{"event_id":"sha256:6bef4968991f7f4ff692b513124e231f740bece750c1d69e2d40c62f85481077","target":"graph","created_at":"2026-05-18T00:07:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Sentence Boundary Detection (SBD) has been a major research topic since Automatic Speech Recognition transcripts have been used for further Natural Language Processing tasks like Part of Speech Tagging, Question Answering or Automatic Summarization. But what about evaluation? Do standard evaluation metrics like precision, recall, F-score or classification error; and more important, evaluating an automatic system against a unique reference is enough to conclude how well a SBD system is performing given the final application of the transcript? In this paper we propose Window-based Sentence Bound","authors_text":"Carlos-Emiliano Gonz\\'alez-Gallardo, Juan-Manuel Torres-Moreno","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-27T14:02:58Z","title":"WiSeBE: Window-based Sentence Boundary Evaluation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.08850","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5b6bfaff9675bd4eed8c5b2cf6c5b7948a0dfcde1330adf1901d11523207a32d","target":"record","created_at":"2026-05-18T00:07:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5271759ead9ff167e6bcfa11f1aa89a180e61e37ee4c5392c70345e8d026187c","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-27T14:02:58Z","title_canon_sha256":"95709a21b27edecab4b327e6d884b4439a0dc34e545ca60b14052b171b360081"},"schema_version":"1.0","source":{"id":"1808.08850","kind":"arxiv","version":1}},"canonical_sha256":"e2a55b9ab3bad698d1d5cfc126e66985c794a8f4a2690283ecc1ff29d36c4b92","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e2a55b9ab3bad698d1d5cfc126e66985c794a8f4a2690283ecc1ff29d36c4b92","first_computed_at":"2026-05-18T00:07:13.047864Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:07:13.047864Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"jS92p0mRPJiIswqXgB6KZDvjOKJ5I26ls1ro94P7zSgXwhenVuAz8Ti4jpzk92qH5Z34fwMBTask5mYI6UWSBA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:07:13.048384Z","signed_message":"canonical_sha256_bytes"},"source_id":"1808.08850","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5b6bfaff9675bd4eed8c5b2cf6c5b7948a0dfcde1330adf1901d11523207a32d","sha256:6bef4968991f7f4ff692b513124e231f740bece750c1d69e2d40c62f85481077"],"state_sha256":"fe6e5cdb94c5ad386015552795437654a2d2cc7e307ff4b2be07d130ed60f0ab"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FO38WbMbA/8RhTIhBKwqVT0iWyiVtOCqhDIKH16dSePeCY259wm9lujfn6bOGl7+y3c0IC7tOC7RgyTyNvrYCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T06:34:46.469981Z","bundle_sha256":"71569e5ac0d73748b6b924b61f038098b7852125cadb298abcdd2da97a4bdca5"}}