{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:SORG75SWWFVIIQOHM5IT3IMNWD","short_pith_number":"pith:SORG75SW","canonical_record":{"source":{"id":"1707.07568","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-24T14:20:07Z","cross_cats_sorted":[],"title_canon_sha256":"abb52d294ba5d481eb6b03830f60ef77f883bae210920f23b264a96b29da8c40","abstract_canon_sha256":"e5ff8325664d4dc593104db6f678f3711abc596bb0ca1ac14d26700c0798fc8f"},"schema_version":"1.0"},"canonical_sha256":"93a26ff656b16a8441c767513da18db0f8011bb36a25dfb8768acdade638fda0","source":{"kind":"arxiv","id":"1707.07568","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.07568","created_at":"2026-05-18T00:39:41Z"},{"alias_kind":"arxiv_version","alias_value":"1707.07568v1","created_at":"2026-05-18T00:39:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.07568","created_at":"2026-05-18T00:39:41Z"},{"alias_kind":"pith_short_12","alias_value":"SORG75SWWFVI","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_16","alias_value":"SORG75SWWFVIIQOH","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_8","alias_value":"SORG75SW","created_at":"2026-05-18T12:31:43Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:SORG75SWWFVIIQOHM5IT3IMNWD","target":"record","payload":{"canonical_record":{"source":{"id":"1707.07568","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-24T14:20:07Z","cross_cats_sorted":[],"title_canon_sha256":"abb52d294ba5d481eb6b03830f60ef77f883bae210920f23b264a96b29da8c40","abstract_canon_sha256":"e5ff8325664d4dc593104db6f678f3711abc596bb0ca1ac14d26700c0798fc8f"},"schema_version":"1.0"},"canonical_sha256":"93a26ff656b16a8441c767513da18db0f8011bb36a25dfb8768acdade638fda0","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:39:41.814725Z","signature_b64":"J4iXBeZqfWRHY0ZHG6PVgQwPNHNZc8nZ1CwumM3AozlnzkER9I3QxSrPgG6gwPxdIvm4HiyTxAbp1justTFIAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"93a26ff656b16a8441c767513da18db0f8011bb36a25dfb8768acdade638fda0","last_reissued_at":"2026-05-18T00:39:41.814026Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:39:41.814026Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1707.07568","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"76c2tE/b2J6i5D1g4jQ8RVLxDtAem4WEZ2D5Rld4k+/JnIKIRrre2EHoQMdZtwanHiGS1Ptystd42eCyxQaEAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T21:12:05.494678Z"},"content_sha256":"9950590b68df5e718f1d58be86d98121461a13fac34b2268b096887f466b4658","schema_version":"1.0","event_id":"sha256:9950590b68df5e718f1d58be86d98121461a13fac34b2268b096887f466b4658"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:SORG75SWWFVIIQOHM5IT3IMNWD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"CAp 2017 challenge: Twitter Named Entity Recognition","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Am\\'elie Martin, C\\'edric Lopez, Coralie Reutenauer, Fr\\'ed\\'erique Segond, Georgios Balikas, Ioannis Partalas, Massih-Reza Amini, Nadia Derbas","submitted_at":"2017-07-24T14:20:07Z","abstract_excerpt":"The paper describes the CAp 2017 challenge. The challenge concerns the problem of Named Entity Recognition (NER) for tweets written in French. We first present the data preparation steps we followed for constructing the dataset released in the framework of the challenge. We begin by demonstrating why NER for tweets is a challenging problem especially when the number of entities increases. We detail the annotation process and the necessary decisions we made. We provide statistics on the inter-annotator agreement, and we conclude the data description part with examples and statistics for the dat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.07568","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"R47AOT6yVN5l3siztSOhRbmlnF4Asdj9oygG9Ky/8fXVdJV4DHdrNfPOd5cb8rXJh6qZpqdIlLzsWr5FrhZyDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T21:12:05.495344Z"},"content_sha256":"616c58cff993f330bd6634c45844e9ef052ea06c62e0ef380b3ddd0146ee2df6","schema_version":"1.0","event_id":"sha256:616c58cff993f330bd6634c45844e9ef052ea06c62e0ef380b3ddd0146ee2df6"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SORG75SWWFVIIQOHM5IT3IMNWD/bundle.json","state_url":"https://pith.science/pith/SORG75SWWFVIIQOHM5IT3IMNWD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SORG75SWWFVIIQOHM5IT3IMNWD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T21:12:05Z","links":{"resolver":"https://pith.science/pith/SORG75SWWFVIIQOHM5IT3IMNWD","bundle":"https://pith.science/pith/SORG75SWWFVIIQOHM5IT3IMNWD/bundle.json","state":"https://pith.science/pith/SORG75SWWFVIIQOHM5IT3IMNWD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SORG75SWWFVIIQOHM5IT3IMNWD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:SORG75SWWFVIIQOHM5IT3IMNWD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e5ff8325664d4dc593104db6f678f3711abc596bb0ca1ac14d26700c0798fc8f","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-24T14:20:07Z","title_canon_sha256":"abb52d294ba5d481eb6b03830f60ef77f883bae210920f23b264a96b29da8c40"},"schema_version":"1.0","source":{"id":"1707.07568","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.07568","created_at":"2026-05-18T00:39:41Z"},{"alias_kind":"arxiv_version","alias_value":"1707.07568v1","created_at":"2026-05-18T00:39:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.07568","created_at":"2026-05-18T00:39:41Z"},{"alias_kind":"pith_short_12","alias_value":"SORG75SWWFVI","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_16","alias_value":"SORG75SWWFVIIQOH","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_8","alias_value":"SORG75SW","created_at":"2026-05-18T12:31:43Z"}],"graph_snapshots":[{"event_id":"sha256:616c58cff993f330bd6634c45844e9ef052ea06c62e0ef380b3ddd0146ee2df6","target":"graph","created_at":"2026-05-18T00:39:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The paper describes the CAp 2017 challenge. The challenge concerns the problem of Named Entity Recognition (NER) for tweets written in French. We first present the data preparation steps we followed for constructing the dataset released in the framework of the challenge. We begin by demonstrating why NER for tweets is a challenging problem especially when the number of entities increases. We detail the annotation process and the necessary decisions we made. We provide statistics on the inter-annotator agreement, and we conclude the data description part with examples and statistics for the dat","authors_text":"Am\\'elie Martin, C\\'edric Lopez, Coralie Reutenauer, Fr\\'ed\\'erique Segond, Georgios Balikas, Ioannis Partalas, Massih-Reza Amini, Nadia Derbas","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-24T14:20:07Z","title":"CAp 2017 challenge: Twitter Named Entity Recognition"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.07568","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9950590b68df5e718f1d58be86d98121461a13fac34b2268b096887f466b4658","target":"record","created_at":"2026-05-18T00:39:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e5ff8325664d4dc593104db6f678f3711abc596bb0ca1ac14d26700c0798fc8f","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-24T14:20:07Z","title_canon_sha256":"abb52d294ba5d481eb6b03830f60ef77f883bae210920f23b264a96b29da8c40"},"schema_version":"1.0","source":{"id":"1707.07568","kind":"arxiv","version":1}},"canonical_sha256":"93a26ff656b16a8441c767513da18db0f8011bb36a25dfb8768acdade638fda0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"93a26ff656b16a8441c767513da18db0f8011bb36a25dfb8768acdade638fda0","first_computed_at":"2026-05-18T00:39:41.814026Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:39:41.814026Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"J4iXBeZqfWRHY0ZHG6PVgQwPNHNZc8nZ1CwumM3AozlnzkER9I3QxSrPgG6gwPxdIvm4HiyTxAbp1justTFIAA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:39:41.814725Z","signed_message":"canonical_sha256_bytes"},"source_id":"1707.07568","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9950590b68df5e718f1d58be86d98121461a13fac34b2268b096887f466b4658","sha256:616c58cff993f330bd6634c45844e9ef052ea06c62e0ef380b3ddd0146ee2df6"],"state_sha256":"d4db1de574fa90a0bb6baf5753959bca79473af21700366dd09292e79c6ea943"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FJLiDPGFDht5L7ATMPyrhn/KXHYJzhPH2N5CKzhBcxcLzqIwbHoQym7ghZVcTgXVyq71+8P8xD17sDlzHtadBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T21:12:05.498536Z","bundle_sha256":"93ef5c1565248c103a52903dc7aa1e7a77519c349ed87a19c1fef8df1b17c253"}}