{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:HNGCSZAREOWKECC7ELVQJH66D5","short_pith_number":"pith:HNGCSZAR","canonical_record":{"source":{"id":"1802.04903","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T00:28:54Z","cross_cats_sorted":["physics.chem-ph"],"title_canon_sha256":"935b6238d074fadcc6520326b66d2dc8a8e017f1aacc5a0c0213afeea056f5e7","abstract_canon_sha256":"5302c651d0a967ee5b61da1b1c5c9014bd0ca0b2eba14c21175d2b77013b772d"},"schema_version":"1.0"},"canonical_sha256":"3b4c29641123aca2085f22eb049fde1f79cedd921403a90a8e575c63716ea850","source":{"kind":"arxiv","id":"1802.04903","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.04903","created_at":"2026-05-18T00:23:22Z"},{"alias_kind":"arxiv_version","alias_value":"1802.04903v1","created_at":"2026-05-18T00:23:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.04903","created_at":"2026-05-18T00:23:22Z"},{"alias_kind":"pith_short_12","alias_value":"HNGCSZAREOWK","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"HNGCSZAREOWKECC7","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"HNGCSZAR","created_at":"2026-05-18T12:32:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:HNGCSZAREOWKECC7ELVQJH66D5","target":"record","payload":{"canonical_record":{"source":{"id":"1802.04903","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T00:28:54Z","cross_cats_sorted":["physics.chem-ph"],"title_canon_sha256":"935b6238d074fadcc6520326b66d2dc8a8e017f1aacc5a0c0213afeea056f5e7","abstract_canon_sha256":"5302c651d0a967ee5b61da1b1c5c9014bd0ca0b2eba14c21175d2b77013b772d"},"schema_version":"1.0"},"canonical_sha256":"3b4c29641123aca2085f22eb049fde1f79cedd921403a90a8e575c63716ea850","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:23:22.261030Z","signature_b64":"T/ddxgcBqMqy/UhsZI/DgKy4R8JK6H7mM63iFtMve3qypVmtPxsoJIWd0OmYHjdZ/sqfigizU668RbVtjBLpAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3b4c29641123aca2085f22eb049fde1f79cedd921403a90a8e575c63716ea850","last_reissued_at":"2026-05-18T00:23:22.260340Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:23:22.260340Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1802.04903","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:23:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CJz0ufFsguUMpUOcYI/5ouBEBXy15OU589IdbqacU3vIMq8MvnBaTfZS8lEPxygx3+cdODsjKYowTxZ5yhWhAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T13:11:08.876546Z"},"content_sha256":"59408642081501474deb4a533615e1b822f43d3d3ddf10f6ea160228783d540c","schema_version":"1.0","event_id":"sha256:59408642081501474deb4a533615e1b822f43d3d3ddf10f6ea160228783d540c"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:HNGCSZAREOWKECC7ELVQJH66D5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Molecular Structure Extraction From Documents Using Deep Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["physics.chem-ph"],"primary_cat":"cs.LG","authors_text":"Carolyn McQuaw, Joshua Staker, Kyle Marshall, Robert Abel","submitted_at":"2018-02-14T00:28:54Z","abstract_excerpt":"Chemical structure extraction from documents remains a hard problem due to both false positive identification of structures during segmentation and errors in the predicted structures. Current approaches rely on handcrafted rules and subroutines that perform reasonably well generally, but still routinely encounter situations where recognition rates are not yet satisfactory and systematic improvement is challenging. Complications impacting performance of current approaches include the diversity in visual styles used by various software to render structures, the frequent use of ad hoc annotations"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.04903","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:23:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qkkRUXjOY4lOJ6nj0zY2uCkkHxzhhgylfLHzt/uRGbtb9DAXJHG9xcjFEmMUANN9SBb1Bcg5DK9ZMk3Mxwv7Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T13:11:08.876895Z"},"content_sha256":"f4c19581d66340448374a121d9757ebbbe75cbe02ef832b1be90631c4298092f","schema_version":"1.0","event_id":"sha256:f4c19581d66340448374a121d9757ebbbe75cbe02ef832b1be90631c4298092f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HNGCSZAREOWKECC7ELVQJH66D5/bundle.json","state_url":"https://pith.science/pith/HNGCSZAREOWKECC7ELVQJH66D5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HNGCSZAREOWKECC7ELVQJH66D5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T13:11:08Z","links":{"resolver":"https://pith.science/pith/HNGCSZAREOWKECC7ELVQJH66D5","bundle":"https://pith.science/pith/HNGCSZAREOWKECC7ELVQJH66D5/bundle.json","state":"https://pith.science/pith/HNGCSZAREOWKECC7ELVQJH66D5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HNGCSZAREOWKECC7ELVQJH66D5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:HNGCSZAREOWKECC7ELVQJH66D5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5302c651d0a967ee5b61da1b1c5c9014bd0ca0b2eba14c21175d2b77013b772d","cross_cats_sorted":["physics.chem-ph"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T00:28:54Z","title_canon_sha256":"935b6238d074fadcc6520326b66d2dc8a8e017f1aacc5a0c0213afeea056f5e7"},"schema_version":"1.0","source":{"id":"1802.04903","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.04903","created_at":"2026-05-18T00:23:22Z"},{"alias_kind":"arxiv_version","alias_value":"1802.04903v1","created_at":"2026-05-18T00:23:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.04903","created_at":"2026-05-18T00:23:22Z"},{"alias_kind":"pith_short_12","alias_value":"HNGCSZAREOWK","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"HNGCSZAREOWKECC7","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"HNGCSZAR","created_at":"2026-05-18T12:32:28Z"}],"graph_snapshots":[{"event_id":"sha256:f4c19581d66340448374a121d9757ebbbe75cbe02ef832b1be90631c4298092f","target":"graph","created_at":"2026-05-18T00:23:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Chemical structure extraction from documents remains a hard problem due to both false positive identification of structures during segmentation and errors in the predicted structures. Current approaches rely on handcrafted rules and subroutines that perform reasonably well generally, but still routinely encounter situations where recognition rates are not yet satisfactory and systematic improvement is challenging. Complications impacting performance of current approaches include the diversity in visual styles used by various software to render structures, the frequent use of ad hoc annotations","authors_text":"Carolyn McQuaw, Joshua Staker, Kyle Marshall, Robert Abel","cross_cats":["physics.chem-ph"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T00:28:54Z","title":"Molecular Structure Extraction From Documents Using Deep Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.04903","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:59408642081501474deb4a533615e1b822f43d3d3ddf10f6ea160228783d540c","target":"record","created_at":"2026-05-18T00:23:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5302c651d0a967ee5b61da1b1c5c9014bd0ca0b2eba14c21175d2b77013b772d","cross_cats_sorted":["physics.chem-ph"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T00:28:54Z","title_canon_sha256":"935b6238d074fadcc6520326b66d2dc8a8e017f1aacc5a0c0213afeea056f5e7"},"schema_version":"1.0","source":{"id":"1802.04903","kind":"arxiv","version":1}},"canonical_sha256":"3b4c29641123aca2085f22eb049fde1f79cedd921403a90a8e575c63716ea850","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3b4c29641123aca2085f22eb049fde1f79cedd921403a90a8e575c63716ea850","first_computed_at":"2026-05-18T00:23:22.260340Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:23:22.260340Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"T/ddxgcBqMqy/UhsZI/DgKy4R8JK6H7mM63iFtMve3qypVmtPxsoJIWd0OmYHjdZ/sqfigizU668RbVtjBLpAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:23:22.261030Z","signed_message":"canonical_sha256_bytes"},"source_id":"1802.04903","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:59408642081501474deb4a533615e1b822f43d3d3ddf10f6ea160228783d540c","sha256:f4c19581d66340448374a121d9757ebbbe75cbe02ef832b1be90631c4298092f"],"state_sha256":"c6bc133a5e24efa2afd389fbd6356d5b72b35e843b327c4237f757520785844b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CIkVW5sXEuf+51hxR6Ha2ESNQbKvNSi2GJBe3Ih2hf5rs39T73TKGJJMt2a2ACYnnbcySUtii8m7Q48jLmWPDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T13:11:08.878964Z","bundle_sha256":"5b4a772bd6f273ecd059266e4b8f4c331ceb40a61770f1d28c5c6244098919dc"}}