{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:E6GED7ZF3D3A277E2EU2EN25FS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"52bfcb213127f5509cc4e89bfe7ff4a8c52abe28cc81ba8f8f0d7a4dedbeca8f","cross_cats_sorted":["cs.AI","cs.MA"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2026-02-14T14:52:36Z","title_canon_sha256":"c9d1d37221f899622fb9d25569718ff818ce14dfe0be59451bffcb9509cfb318"},"schema_version":"1.0","source":{"id":"2602.13812","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2602.13812","created_at":"2026-06-01T02:03:35Z"},{"alias_kind":"arxiv_version","alias_value":"2602.13812v3","created_at":"2026-06-01T02:03:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2602.13812","created_at":"2026-06-01T02:03:35Z"},{"alias_kind":"pith_short_12","alias_value":"E6GED7ZF3D3A","created_at":"2026-06-01T02:03:35Z"},{"alias_kind":"pith_short_16","alias_value":"E6GED7ZF3D3A277E","created_at":"2026-06-01T02:03:35Z"},{"alias_kind":"pith_short_8","alias_value":"E6GED7ZF","created_at":"2026-06-01T02:03:35Z"}],"graph_snapshots":[{"event_id":"sha256:96134ffe3eddc17a8862cd069d84df0eb9a0d91ed47887b9f1749d1a4794a038","target":"graph","created_at":"2026-06-01T02:03:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2602.13812/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Document-to-table (Doc2Table) extraction derives structured tables from unstructured documents under a target schema, enabling reliable and verifiable SQL-based data analytics. Although large language models (LLMs) have shown promise in flexible information extraction, their ability to produce precisely structured tables remains insufficiently understood, particularly for indirect extraction that requires complex capabilities such as reasoning and conflict resolution. Existing benchmarks neither explicitly distinguish nor comprehensively cover the diverse capabilities required in Doc2Table ext","authors_text":"Congcong Ge, Kezheng Tang, Nan Tang, Yunjun Gao, Yuxiang Guo, Zhuoran Du","cross_cats":["cs.AI","cs.MA"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2026-02-14T14:52:36Z","title":"DTBench: A Synthetic Benchmark for Document-to-Table Extraction"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2602.13812","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:59f481a60ed2ea086508f404bfad07a81e34d6d9f2374464fac13fe83100cd8c","target":"record","created_at":"2026-06-01T02:03:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"52bfcb213127f5509cc4e89bfe7ff4a8c52abe28cc81ba8f8f0d7a4dedbeca8f","cross_cats_sorted":["cs.AI","cs.MA"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2026-02-14T14:52:36Z","title_canon_sha256":"c9d1d37221f899622fb9d25569718ff818ce14dfe0be59451bffcb9509cfb318"},"schema_version":"1.0","source":{"id":"2602.13812","kind":"arxiv","version":3}},"canonical_sha256":"278c41ff25d8f60d7fe4d129a2375d2ca0e9408f993c952fb8a6cd26a5784e95","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"278c41ff25d8f60d7fe4d129a2375d2ca0e9408f993c952fb8a6cd26a5784e95","first_computed_at":"2026-06-01T02:03:35.245600Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-01T02:03:35.245600Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"KW5D1PLQCqhrPCHcUyPm/yv8NeD7N7HGJ7RHKdd/XvRSII8HEQH5Un562nTL9uQ42BoyozADYmdHYkNljBpoAQ==","signature_status":"signed_v1","signed_at":"2026-06-01T02:03:35.246558Z","signed_message":"canonical_sha256_bytes"},"source_id":"2602.13812","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:59f481a60ed2ea086508f404bfad07a81e34d6d9f2374464fac13fe83100cd8c","sha256:96134ffe3eddc17a8862cd069d84df0eb9a0d91ed47887b9f1749d1a4794a038"],"state_sha256":"84ef3753a37329d0c5c44b68242d8b96a88c1069f08a8f60a0a89b1686a35bea"}